In [3]:
from transformers import GPT2LMHeadModel, GPT2TokenizerFast

device = "cuda:1"
model_id = "gpt2-large"
model = GPT2LMHeadModel.from_pretrained(model_id).to(device)
tokenizer = GPT2TokenizerFast.from_pretrained(model_id)

In [25]:
import torch
from tqdm import tqdm

def compute_perplexity(dialog, prmt, mod_idx=None):
    # Tokenize both utterances
    perpl = []
    
    for idx, (cntx, tkn) in enumerate(zip(dialog[:-1], dialog[1:])):
        if mod_idx is None:
            add_ = ""
        else:
            # if it is not [MOD]'s turn and we are not trying to predict [MOD]'s utterance, we want to add its utterance as context!
            if ("[MOD]" not in cntx and "[MOD]" not in tkn) and idx!=0:
                add_ = np.asarray(dialog)[mod_idx[idx] + 1]
            else:
                add_ = ""
        
        prompt = tokenizer.encode(prmt, return_tensors="pt") 
        context = tokenizer.encode(add_ + " " + cntx, return_tensors="pt")
        tokens = tokenizer.encode(tkn, return_tensors="pt")
        encodings = torch.cat((prompt, context,tokens), dim=1)
        max_length = model.config.n_positions

        stride = 2024
        seq_len = encodings.size(1)

        nlls = []
        prev_end_loc = prompt.size(1) + context.size(1)

        for begin_loc in range(0, seq_len, stride):
            end_loc = min(begin_loc + max_length, seq_len)
            trg_len = end_loc - prev_end_loc  # may be different from stride on last loop
            input_ids = encodings[:, begin_loc:end_loc].to(device)
            target_ids = input_ids.clone()
            target_ids[:, :-trg_len] = -100
            
            with torch.no_grad():
                outputs = model(input_ids, labels=target_ids)

                # loss is calculated using CrossEntropyLoss which averages over valid labels
                # N.B. the model only calculates loss over trg_len - 1 labels, because it internally shifts the labels
                # to the left by 1.
                neg_log_likelihood = outputs.loss

            nlls.append(neg_log_likelihood)

            prev_end_loc = end_loc
            if end_loc == seq_len:
                break
        perpl.append(torch.exp(torch.stack(nlls).mean()).item())
        print(torch.exp(torch.stack(nlls).mean()).item())
    return perpl

In [40]:
import torch
from tqdm import tqdm

def compute_perplexity(dialog, prmt, mod_idx=None):
    # Tokenize both utterances
    perpl = []
    
    for idx, cntx in enumerate(dialog[1:]):
        
        prompt = tokenizer.encode(prmt, return_tensors="pt") 
        context += tokenizer.encode(cntx, return_tensors="pt")
        tokens = tokenizer.encode(tkn, return_tensors="pt")

        encodings = torch.cat((prompt, context,tokens), dim=1)
        max_length = model.config.n_positions

        stride = 2024
        seq_len = encodings.size(1)

        nlls = []
        prev_end_loc = prompt.size(1) + context.size(1)
        
        for begin_loc in range(0, seq_len, stride):
            end_loc = min(begin_loc + max_length, seq_len)
            trg_len = end_loc - prev_end_loc  # may be different from stride on last loop
            input_ids = encodings[:, begin_loc:end_loc].to(device)
            target_ids = input_ids.clone()
            target_ids[:, :-trg_len] = -100
            
            with torch.no_grad():
                outputs = model(input_ids, labels=target_ids)
                neg_log_likelihood = outputs.loss

            nlls.append(neg_log_likelihood)

            prev_end_loc = end_loc
            if end_loc == seq_len:
                break
        perpl.append(torch.exp(torch.stack(nlls).mean()).item())
        print(torch.exp(torch.stack(nlls).mean()).item())
    return perpl

In [41]:
import numpy as np
import re
# Example usage
dialog = ["",
          "[Mark]: How are you doing today?",
          "[Lisa]: I'm good, thanks for asking.",
          "[Mark]: Did you complete the report?",
          "[Lisa]: Not yet, but I'll have it ready by tomorrow."]
prmt = "This is a conversation between Mark and Lisa.\nPredict the next most probable utterance:"

pattern = r'\[([^\]]+)\]'
matches = re.findall(pattern, "".join(dialog))
perpl = compute_perplexity(dialog, prmt)

for patt in np.unique(matches):
    idx = np.asarray([index for index, element in enumerate(matches) if element == patt])
    print(f"{patt} :", np.mean(np.asarray(perpl)[idx]))

for d, p in zip(dialog[1:], perpl):
    print(f"{d}, {p}")

RuntimeError: output with shape [0] doesn't match the broadcast shape [1, 0]

In [27]:
gpt1 = ["",
        "[D]: Hey, I've been thinking about our upcoming project. I believe we should take a more assertive approach to meet our deadlines.",
        "[S]: Oh, absolutely. I completely agree. What specific tasks do you think I should focus on to support our goals?",
        "[D]: Great. I need you to take charge of the research phase. Make sure to gather all the relevant information and compile a detailed report by the end of the week.",
        "[S]: Of course, I'll get started right away. Should I consider any specific sources or themes?",
        "[D]: I trust your judgment, but prioritize industry reports and recent studies. We need solid data to make our case.",
        "[S]: Got it. I'll make sure to provide a comprehensive overview in the report.",
        "[D]: Perfect. Additionally, I'd like you to prepare a brief presentation summarizing the key findings. We have a meeting next Monday, and your insights will be crucial.",
        "[S]: No problem. I'll ensure the presentation is concise and highlights the most important points.",
        "[D]: Good. Let me know if you need any assistance, but I expect you to handle this with minimal supervision.",
        "[S]: Thank you for entrusting me with this responsibility. I'll do my best to meet your expectations."]

prmt = "This is a conversation between D and S.\nPredict the next most probable utterance:"

pattern = r'\[([^\]]+)\]'
matches = re.findall(pattern, "".join(gpt1))
perpl = compute_perplexity(gpt1, prmt)
print(perpl)
for patt in np.unique(matches):
    idx = np.asarray([index for index, element in enumerate(matches) if element == patt])
    print(f"{patt} :", np.mean(np.asarray(perpl)[idx]))
for d, p in zip(gpt1[1:], perpl):
    print(f"{d}, {p}")

prompt:  This is a conversation between D and S.
Predict the next most probable utterance:
context:  
token:  [D]: Hey, I've been thinking about our upcoming project. I believe we should take a more assertive approach to meet our deadlines.
25.97359848022461
prompt:  This is a conversation between D and S.
Predict the next most probable utterance:
context:  [D]: Hey, I've been thinking about our upcoming project. I believe we should take a more assertive approach to meet our deadlines.
token:  [S]: Oh, absolutely. I completely agree. What specific tasks do you think I should focus on to support our goals?
13.740754127502441
prompt:  This is a conversation between D and S.
Predict the next most probable utterance:
context:  [S]: Oh, absolutely. I completely agree. What specific tasks do you think I should focus on to support our goals?
token:  [D]: Great. I need you to take charge of the research phase. Make sure to gather all the relevant information and compile a detailed report by th

In [28]:
file_path = "../data/gpt4/teacher_dominated.txt"
with open(file_path, 'r') as file:
    datasets = file.read().split('\n\n')

# Now 'dataset' is a list where each element is a chunk from the file
for dataset in datasets:
    firstliner = ""
    dataset = [firstliner] + dataset.split("\n")
    print(dataset)
    prmt = "This is a conversation between Teacher and Student.\nPredict the next most probable utterance:"

    pattern = r'\[([^\]]+)\]'
    matches = re.findall(pattern, "".join(dataset))
    perpl = compute_perplexity(dataset, prmt)
    for patt in np.unique(matches):
        idx = np.asarray([index for index, element in enumerate(matches) if element == patt])
        print(f"{patt} :", np.mean(np.asarray(perpl)[idx]))

['', '[Teacher]: "Good morning, John. Did you complete your homework?"', '[Student]: "Yes, I did."', '[Teacher]: "Great! Can you show it to me?"', '[Student]: "Sure, here it is."', '[Teacher]: "Well done, John. Keep up the good work."']
prompt:  This is a conversation between Teacher and Student.
Predict the next most probable utterance:
context:  
token:  [Teacher]: "Good morning, John. Did you complete your homework?"
23.159488677978516
prompt:  This is a conversation between Teacher and Student.
Predict the next most probable utterance:
context:  [Teacher]: "Good morning, John. Did you complete your homework?"
token:  [Student]: "Yes, I did."
3.780818462371826
prompt:  This is a conversation between Teacher and Student.
Predict the next most probable utterance:
context:  [Student]: "Yes, I did."
token:  [Teacher]: "Great! Can you show it to me?"
9.264633178710938
prompt:  This is a conversation between Teacher and Student.
Predict the next most probable utterance:
context:  [Teacher

7.033215045928955
prompt:  This is a conversation between Teacher and Student.
Predict the next most probable utterance:
context:  [Teacher]: "Let's go over it together."
token:  [Student]: "That would be helpful."
10.414844512939453
prompt:  This is a conversation between Teacher and Student.
Predict the next most probable utterance:
context:  [Student]: "That would be helpful."
token:  [Teacher]: "First, let's look at the instructions."
11.24404525756836
prompt:  This is a conversation between Teacher and Student.
Predict the next most probable utterance:
context:  [Teacher]: "First, let's look at the instructions."
token:  [Student]: "Oh, I see where I went wrong."
10.238276481628418
Student : 25.426980018615723
Teacher : 9.138630151748657
['', '[Teacher]: "Today we will be discussing the civil war. Any questions before we start?"', '[Student]: "No, I\'m ready."', '[Teacher]: "Great, let\'s begin."', '[Student]: "Okay."', '[Teacher]: "The civil war was a pivotal moment in our histor

6.835707664489746
prompt:  This is a conversation between Teacher and Student.
Predict the next most probable utterance:
context:  [Student]: "Okay."
token:  [Teacher]: "Democracy is a form of government where the people have the power to choose their leaders."
6.414319038391113
Student : 5.971709489822388
Teacher : 13.262872536977133
['', '[Student]: "Can we go over the last chapter again? I\'m a bit confused."', '[Teacher]: "Of course, let\'s review it together."', '[Student]: "Thank you."', '[Teacher]: "Let\'s start from the beginning."', '[Student]: "That makes it clearer."']
prompt:  This is a conversation between Teacher and Student.
Predict the next most probable utterance:
context:  
token:  [Student]: "Can we go over the last chapter again? I'm a bit confused."
27.45329475402832
prompt:  This is a conversation between Teacher and Student.
Predict the next most probable utterance:
context:  [Student]: "Can we go over the last chapter again? I'm a bit confused."
token:  [Teacher

6.415534973144531
prompt:  This is a conversation between Teacher and Student.
Predict the next most probable utterance:
context:  [Teacher]: "Of course, let's review it together."
token:  [Student]: "Thank you."
7.232381820678711
prompt:  This is a conversation between Teacher and Student.
Predict the next most probable utterance:
context:  [Student]: "Thank you."
token:  [Teacher]: "Let's start from the beginning."
6.786656379699707
prompt:  This is a conversation between Teacher and Student.
Predict the next most probable utterance:
context:  [Teacher]: "Let's start from the beginning."
token:  [Student]: "That makes it clearer."
19.93571662902832
Student : 18.207131067911785
Teacher : 6.601095676422119
['', '[Teacher]: "Let\'s start the class with a quick recap of yesterday\'s lesson."', '[Student]: "Sure."', '[Teacher]: "We discussed the concept of democracy. Can you tell me what you remember?"', '[Student]: "Democracy is a form of government where the people have the power to cho

19.93571662902832
Student : 18.207131067911785
Teacher : 6.601095676422119
['', '[Teacher]: "Let\'s start the class with a quick recap of yesterday\'s lesson."', '[Student]: "Sure."', '[Teacher]: "We discussed the concept of evolution. Can you tell me what you remember?"', '[Student]: "Evolution is the process by which species of organisms undergo change over time."', '[Teacher]: "Excellent! Let\'s move on to today\'s lesson."']
prompt:  This is a conversation between Teacher and Student.
Predict the next most probable utterance:
context:  
token:  [Teacher]: "Let's start the class with a quick recap of yesterday's lesson."
20.01887321472168
prompt:  This is a conversation between Teacher and Student.
Predict the next most probable utterance:
context:  [Teacher]: "Let's start the class with a quick recap of yesterday's lesson."
token:  [Student]: "Sure."
8.22253131866455
prompt:  This is a conversation between Teacher and Student.
Predict the next most probable utterance:
context:  [St

14.846953392028809
prompt:  This is a conversation between Teacher and Student.
Predict the next most probable utterance:
context:  [Teacher]: "We discussed the concept of human rights. Can you tell me what you remember?"
token:  [Student]: "Human rights are the basic rights and freedoms to which all individuals are entitled."
6.3163323402404785
prompt:  This is a conversation between Teacher and Student.
Predict the next most probable utterance:
context:  [Student]: "Human rights are the basic rights and freedoms to which all individuals are entitled."
token:  [Teacher]: "Excellent! Let's move on to today's lesson."
8.33304214477539
Student : 7.269431829452515
Teacher : 14.399622917175293
['', '[Teacher]: "Today we will be discussing the concept of renewable energy. Are you ready?"', '[Student]: "Yes, I am."', '[Teacher]: "Great, let\'s start with the definition."', '[Student]: "Okay."', '[Teacher]: "Renewable energy is energy that is collected from renewable resources, which are natu

24.141788482666016
prompt:  This is a conversation between Teacher and Student.
Predict the next most probable utterance:
context:  [Teacher]: "Today we will be discussing the concept of algebra. Are you ready?"
token:  [Student]: "Yes, I am."
3.8100030422210693
prompt:  This is a conversation between Teacher and Student.
Predict the next most probable utterance:
context:  [Student]: "Yes, I am."
token:  [Teacher]: "Great, let's start with the definition."
9.019451141357422
prompt:  This is a conversation between Teacher and Student.
Predict the next most probable utterance:
context:  [Teacher]: "Great, let's start with the definition."
token:  [Student]: "Okay."
7.042109489440918
prompt:  This is a conversation between Teacher and Student.
Predict the next most probable utterance:
context:  [Student]: "Okay."
token:  [Teacher]: "Algebra is a branch of mathematics dealing with symbols and the rules for manipulating those symbols."
12.009552001953125
Student : 5.426056265830994
Teacher 

7.042109489440918
prompt:  This is a conversation between Teacher and Student.
Predict the next most probable utterance:
context:  [Student]: "Okay."
token:  [Teacher]: "Geometry is a branch of mathematics concerned with questions of shape, size, relative position of figures, and the properties of space."
13.482544898986816
Student : 5.451420783996582
Teacher : 15.421844164530436
['', '[Student]: "I\'m having trouble with this biology question."', '[Teacher]: "Let\'s break it down together."', '[Student]: "That would be helpful."', '[Teacher]: "First, let\'s look at the cell structure."', '[Student]: "Oh, I see where I went wrong."']
prompt:  This is a conversation between Teacher and Student.
Predict the next most probable utterance:
context:  
token:  [Student]: "I'm having trouble with this biology question."
54.13230895996094
prompt:  This is a conversation between Teacher and Student.
Predict the next most probable utterance:
context:  [Student]: "I'm having trouble with this biol

8.528223991394043
prompt:  This is a conversation between Teacher and Student.
Predict the next most probable utterance:
context:  [Teacher]: "Let's break it down together."
token:  [Student]: "That would be helpful."
10.194622039794922
prompt:  This is a conversation between Teacher and Student.
Predict the next most probable utterance:
context:  [Student]: "That would be helpful."
token:  [Teacher]: "First, let's look at the grammar rules."
9.624067306518555
prompt:  This is a conversation between Teacher and Student.
Predict the next most probable utterance:
context:  [Teacher]: "First, let's look at the grammar rules."
token:  [Student]: "Oh, I see where I went wrong."
11.429396629333496
Student : 22.622727394104004
Teacher : 9.076145648956299
['', '[Teacher]: "Today we will be discussing the concept of economics. Any questions before we start?"', '[Student]: "No, I\'m ready."', '[Teacher]: "Great, let\'s begin."', '[Student]: "Okay."', '[Teacher]: "Economics is a social science co

12.185187339782715
Student : 10.541337172190348
Teacher : 6.964186906814575
['', '[Teacher]: "I\'ve reviewed your assignment, and I have some feedback. You\'ve done a good job overall, but there are a few areas where you could improve."', '[Student]: "I appreciate your feedback, sir. Could you please elaborate on the areas I need to improve?"', '[Teacher]: "Sure. In the second question, you didn\'t provide enough evidence to support your argument. Also, your conclusion could be more concise."', '[Student]: "I understand. I\'ll work on these areas. Thank you for your feedback."', '[Teacher]: "You\'re welcome. Keep up the good work."']
prompt:  This is a conversation between Teacher and Student.
Predict the next most probable utterance:
context:  
token:  [Teacher]: "I've reviewed your assignment, and I have some feedback. You've done a good job overall, but there are a few areas where you could improve."
10.789400100708008
prompt:  This is a conversation between Teacher and Student.
Pre

14.313230514526367
prompt:  This is a conversation between Teacher and Student.
Predict the next most probable utterance:
context:  [Teacher]: "That's a good strategy. Remember to take breaks and not to cram all the information at once. Consistent study is more effective."
token:  [Student]: "Thank you for the advice, sir. I'll keep that in mind."
5.5925374031066895
prompt:  This is a conversation between Teacher and Student.
Predict the next most probable utterance:
context:  [Student]: "Thank you for the advice, sir. I'll keep that in mind."
token:  [Teacher]: "You're welcome. All the best for your exams."
6.720533847808838
Student : 22.289026498794556
Teacher : 14.60498571395874
['', '[Teacher]: "Effective time management is crucial for academic success. Have you thought about how you plan your study time?"', '[Student]: "I try to study for a few hours every day after school. But sometimes, I find it hard to stick to my schedule."', '[Teacher]: "It\'s important to have a realistic s

6.416811943054199
prompt:  This is a conversation between Teacher and Student.
Predict the next most probable utterance:
context:  [Student]: "I haven't, but I'll consider it. Thank you for your understanding, sir."
token:  [Teacher]: "You're welcome. Remember, we're here to support you."
5.70031213760376
Student : 16.489840030670166
Teacher : 5.958224058151245
['', '[Teacher]: "I\'ve noticed you have a keen interest in literature. Have you thought about exploring this interest further?"', '[Student]: "I love reading, but I\'m not sure how to explore it further."', '[Teacher]: "You could consider joining a book club or even starting a blog to review books. It could be a great way to nurture your interest."', '[Student]: "That sounds interesting. I\'ll definitely consider it. Thank you, Miss."', '[Teacher]: "You\'re welcome. I\'m sure you\'ll do great."']
prompt:  This is a conversation between Teacher and Student.
Predict the next most probable utterance:
context:  
token:  [Teacher]: 

8.188695907592773
Student : 11.753832817077637
Teacher : 9.189117272694906
['', '[Teacher]: "Understanding the real-world application of a subject can enhance its relevance. Can anyone give an example of how we use algebra in our daily lives?"', '[Student]: "We use algebra when we calculate distances or when we manage our finances."', '[Teacher]: "Exactly. Understanding the practical application of a subject can make it more interesting."', '[Student]: "I agree, sir. It makes the subject more relatable."', '[Teacher]: "Absolutely. Let\'s try to relate our subjects to real-world scenarios whenever we can."']
prompt:  This is a conversation between Teacher and Student.
Predict the next most probable utterance:
context:  
token:  [Teacher]: "Understanding the real-world application of a subject can enhance its relevance. Can anyone give an example of how we use algebra in our daily lives?"
39.850704193115234
prompt:  This is a conversation between Teacher and Student.
Predict the next mos

2106.2685546875
prompt:  This is a conversation between Teacher and Student.
Predict the next most probable utterance:
context:   
token:  [Student]: "Sir, we're having some conflicts in our group project. We can't agree on the direction of the project."
19.74815559387207
prompt:  This is a conversation between Teacher and Student.
Predict the next most probable utterance:
context:  [Student]: "Sir, we're having some conflicts in our group project. We can't agree on the direction of the project."
token:  [Teacher]: "Conflicts are common in group projects. The key is to communicate effectively. Listen to each other's ideas and try to find a compromise."
8.028877258300781
prompt:  This is a conversation between Teacher and Student.
Predict the next most probable utterance:
context:  [Teacher]: "Conflicts are common in group projects. The key is to communicate effectively. Listen to each other's ideas and try to find a compromise."
token:  [Student]: "We'll try that. Thank you, sir."
12.4

9.331642150878906
prompt:  This is a conversation between Teacher and Student.
Predict the next most probable utterance:
context:  [Teacher]: "That's a valid point. AI might not consider fairness, privacy, and other ethical issues. What can be done to address this?"
token:  [Student]: "We could incorporate ethical guidelines into the AI's decision-making process."
8.555794715881348
prompt:  This is a conversation between Teacher and Student.
Predict the next most probable utterance:
context:  [Student]: "We could incorporate ethical guidelines into the AI's decision-making process."
token:  [Teacher]: "Excellent. That's one possible solution. Any other thoughts?"
13.542702674865723
Student : 12.557013034820557
Teacher : 14.573992729187012
['', '[Student]: "Miss, I\'m feeling stressed about the upcoming exams. I\'m not sure how to manage it."', '[Teacher]: "It\'s normal to feel stressed before exams. But there are ways to manage it. Firstly, create a study schedule. This will help you s

RuntimeError: Expected tensor for argument #1 'indices' to have one of the following scalar types: Long, Int; but got torch.cuda.FloatTensor instead (while checking arguments for embedding)

In [29]:
file_path = "../data/gpt4/student_dominated.txt"
with open(file_path, 'r') as file:
    datasets = file.read().split('\n\n')

# Now 'dataset' is a list where each element is a chunk from the file
for dataset in datasets:
    firstliner = "This is a conversation between Teacher and Student. "
    dataset = [firstliner] + dataset.split("\n")
    print(dataset)
    prmt = "Predict the next most probable utterance:"

    pattern = r'\[([^\]]+)\]'
    matches = re.findall(pattern, "".join(dataset))
    perpl = compute_perplexity(dataset, prmt)
    for patt in np.unique(matches):
        idx = np.asarray([index for index, element in enumerate(matches) if element == patt])
        print(f"{patt} :", np.mean(np.asarray(perpl)[idx]))

['This is a conversation between Teacher and Student. ', '[Student]: "Miss, I have prepared a presentation on the solar system. Can I present it to the class?"', '[Teacher]: "Sure, go ahead."', '[Student]: "Thank you. So, the solar system consists of the Sun and everything that orbits around it."', '[Teacher]: "That\'s correct."', '[Student]: "There are eight planets in the solar system. They are Mercury, Venus, Earth, Mars, Jupiter, Saturn, Uranus, and Neptune."', '[Teacher]: "Very good. Continue."']
prompt:  Predict the next most probable utterance:
context:  This is a conversation between Teacher and Student. 
token:  [Student]: "Miss, I have prepared a presentation on the solar system. Can I present it to the class?"
20.73455238342285
prompt:  Predict the next most probable utterance:
context:  [Student]: "Miss, I have prepared a presentation on the solar system. Can I present it to the class?"
token:  [Teacher]: "Sure, go ahead."
5.137509346008301
prompt:  Predict the next most pr

5.735140800476074
prompt:  Predict the next most probable utterance:
context:  [Teacher]: "Sure, go ahead."
token:  [Student]: "Thank you. 'To Kill a Mockingbird' is a novel by Harper Lee published in 1960. It was immediately successful, winning the Pulitzer Prize, and has become a classic of modern American literature."
8.99692153930664
prompt:  Predict the next most probable utterance:
context:  [Student]: "Thank you. 'To Kill a Mockingbird' is a novel by Harper Lee published in 1960. It was immediately successful, winning the Pulitzer Prize, and has become a classic of modern American literature."
token:  [Teacher]: "That's correct."
12.32402515411377
prompt:  Predict the next most probable utterance:
context:  [Teacher]: "That's correct."
token:  [Student]: "The plot and characters are loosely based on Lee's observations of her family, her neighbors and an event that occurred near her hometown of Monroeville, Alabama, in 1936, when she was 10 years old."
20.284957885742188
prompt: 

7.917330741882324
prompt:  Predict the next most probable utterance:
context:  [Teacher]: "That's correct."
token:  [Student]: "It's the force that keeps us on the ground and the planets orbiting the sun."
21.184602737426758
prompt:  Predict the next most probable utterance:
context:  [Student]: "It's the force that keeps us on the ground and the planets orbiting the sun."
token:  [Teacher]: "Excellent explanation."
34.6729621887207
Student : 14.81723403930664
Teacher : 24.765034039815266
['This is a conversation between Teacher and Student. ', '[Student]: "Sir, I have prepared a presentation on the human body. Can I present it to the class?"', '[Teacher]: "Sure, go ahead."', '[Student]: "Thank you. The human body is made up of several organ systems that work together as one unit."', '[Teacher]: "That\'s correct."', '[Student]: "These systems include the circulatory system, respiratory system, immune system, skeletal system, digestive system, nervous system, and more."', '[Teacher]: "V

8.733360290527344
prompt:  Predict the next most probable utterance:
context:  [Teacher]: "That's correct."
token:  [Student]: "It's a major issue that's largely caused by human activities, such as burning fossil fuels, deforestation, and industrial processes."
17.133880615234375
prompt:  Predict the next most probable utterance:
context:  [Student]: "It's a major issue that's largely caused by human activities, such as burning fossil fuels, deforestation, and industrial processes."
token:  [Teacher]: "Excellent explanation."
33.373477935791016
Student : 12.7946138381958
Teacher : 24.07387860616048
['This is a conversation between Teacher and Student. ', '[Student]: "Miss, I have prepared a presentation on the Roman Empire. Can I present it to the class?"', '[Teacher]: "Sure, go ahead."', '[Student]: "Thank you. The Roman Empire was the post-Republican period of ancient Rome."', '[Teacher]: "That\'s correct."', '[Student]: "It had a government headed by emperors and large territorial h

37.34337615966797
prompt:  Predict the next most probable utterance:
context:  [Student]: "Enlightenment thinkers sought to reform society and advance knowledge using reason and the scientific method."
token:  [Teacher]: "Very good. Continue."
24.090097427368164
Student : 25.961419105529785
Teacher : 13.59657653172811
['This is a conversation between Teacher and Student. ', '[Teacher]: "Can anyone explain the concept of artificial intelligence?"', '[Student]: "Yes, I can. Artificial intelligence refers to the simulation of human intelligence in machines that are programmed to think like humans and mimic their actions."', '[Teacher]: "That\'s correct."', '[Student]: "The term may also be applied to any machine that exhibits traits associated with a human mind such as learning and problem-solving."', '[Teacher]: "Excellent explanation."']
prompt:  Predict the next most probable utterance:
context:  This is a conversation between Teacher and Student. 
token:  [Teacher]: "Can anyone explai

11.351787567138672
prompt:  Predict the next most probable utterance:
context:  [Student]: "Yes, I can. Genetic engineering is the direct manipulation of an organism's genes using biotechnology. It's a set of technologies used to change the genetic makeup of cells, including the transfer of genes within and across species boundaries to produce improved or novel organisms."
token:  [Teacher]: "That's a comprehensive definition. Can you give us an example of its application?"
9.51156234741211
prompt:  Predict the next most probable utterance:
context:  [Teacher]: "That's a comprehensive definition. Can you give us an example of its application?"
token:  [Student]: "Sure, one of the most common examples is the creation of genetically modified crops, like corn and soybeans, that are resistant to pests or drought."
8.279818534851074
prompt:  Predict the next most probable utterance:
context:  [Student]: "Sure, one of the most common examples is the creation of genetically modified crops, li

25.855445861816406
prompt:  Predict the next most probable utterance:
context:  [Student]: "Miss, I've been researching the topic of the American Civil Rights Movement. May I share my findings?"
token:  [Teacher]: "Absolutely, we'd love to hear your insights."
7.725945949554443
prompt:  Predict the next most probable utterance:
context:  [Teacher]: "Absolutely, we'd love to hear your insights."
token:  [Student]: "The American Civil Rights Movement was a decades-long struggle by African Americans and their like-minded allies to end institutionalized racial discrimination, disenfranchisement, and racial segregation in the United States. The movement has its roots in the Reconstruction era during the late 19th century, although it made its largest legislative gains in the mid-1960s after years of direct actions and grassroots protests."
11.205387115478516
prompt:  Predict the next most probable utterance:
context:  [Student]: "The American Civil Rights Movement was a decades-long struggl

11.22217845916748
prompt:  Predict the next most probable utterance:
context:  [Student]: "I plan to review the lecture notes and textbook chapters first, then do the practice problems. After that, I'll review the solutions to the problems and make sure I understand them. Finally, I'll review the material again and do more practice problems."
token:  [Teacher]: "That sounds like a solid strategy. Just make sure to take breaks and not to cram all your studying into one session."
12.196406364440918
prompt:  Predict the next most probable utterance:
context:  [Teacher]: "That sounds like a solid strategy. Just make sure to take breaks and not to cram all your studying into one session."
token:  [Student]: "I'll keep that in mind. Thanks for the feedback."
6.843672275543213
Student : 10.282826582590738
Teacher : 8.896633863449097
['This is a conversation between Teacher and Student. ', '[Student]: "Miss, I\'ve been reviewing the material for the exam and I\'ve noticed that I\'m having trou

17.2763671875
prompt:  Predict the next most probable utterance:
context:  [Student]: "Firstly, I'm having trouble understanding the concept of the water cycle. Could you explain it again?"
token:  [Teacher]: "Sure, the water cycle describes the continuous movement of water on, above, and below the surface of the Earth."
7.956638336181641
prompt:  Predict the next most probable utterance:
context:  [Teacher]: "Sure, the water cycle describes the continuous movement of water on, above, and below the surface of the Earth."
token:  [Student]: "I see, so it's a cycle of evaporation, condensation, and precipitation. And what role does the sun play in this cycle?"
6.188226699829102
prompt:  Predict the next most probable utterance:
context:  [Student]: "I see, so it's a cycle of evaporation, condensation, and precipitation. And what role does the sun play in this cycle?"
token:  [Teacher]: "The sun provides the energy that drives the water cycle. It causes the evaporation of water from the o

24.664369583129883
prompt:  Predict the next most probable utterance:
context:  [Student]: "Sir, I want to discuss my academic goals for this semester. I aim to improve my grades in Mathematics and Science."
token:  [Teacher]: "That's a good goal. How do you plan to achieve it?"
5.0992045402526855
prompt:  Predict the next most probable utterance:
context:  [Teacher]: "That's a good goal. How do you plan to achieve it?"
token:  [Student]: "I plan to devote more time to these subjects and solve more practice problems. I also plan to attend extra classes if necessary."
18.05356216430664
prompt:  Predict the next most probable utterance:
context:  [Student]: "I plan to devote more time to these subjects and solve more practice problems. I also plan to attend extra classes if necessary."
token:  [Teacher]: "That sounds like a good plan. Remember, consistency is key. Keep me updated on your progress."
9.688471794128418
prompt:  Predict the next most probable utterance:
context:  [Teacher]: 

7.666356086730957
prompt:  Predict the next most probable utterance:
context:  [Teacher]: "I'm glad you found it useful. What were your key takeaways?"
token:  [Student]: "The speaker emphasized the importance of resilience and innovation in entrepreneurship. He also shared his own experiences which were very inspiring."
21.74724578857422
prompt:  Predict the next most probable utterance:
context:  [Student]: "The speaker emphasized the importance of resilience and innovation in entrepreneurship. He also shared his own experiences which were very inspiring."
token:  [Teacher]: "Those are great takeaways. Remember, learning is not confined to the classroom. There's a lot we can learn from people's experiences."
13.245261192321777
prompt:  Predict the next most probable utterance:
context:  [Teacher]: "Those are great takeaways. Remember, learning is not confined to the classroom. There's a lot we can learn from people's experiences."
token:  [Student]: "Absolutely, sir. I look forward t

6.389886379241943
prompt:  Predict the next most probable utterance:
context:  [Teacher]: "I'm glad you found it useful. What was your favorite part?"
token:  [Student]: "I particularly enjoyed the exhibit on Egyptian civilization. The artifacts were fascinating and the information provided was very detailed."
23.96896743774414
prompt:  Predict the next most probable utterance:
context:  [Student]: "I particularly enjoyed the exhibit on Egyptian civilization. The artifacts were fascinating and the information provided was very detailed."
token:  [Teacher]: "That's great. Did you learn anything new?"
7.723758220672607
prompt:  Predict the next most probable utterance:
context:  [Teacher]: "That's great. Did you learn anything new?"
token:  [Student]: "Yes, I learned about their writing system, hieroglyphics, and their religious beliefs. It was interesting to see how advanced their civilization was."
9.910542488098145
prompt:  Predict the next most probable utterance:
context:  [Student]

6.356403827667236
prompt:  Predict the next most probable utterance:
context:  [Student]: "I think I didn't manage my time well. I spent too much time on a few questions and didn't have enough time for the rest."
token:  [Teacher]: "That's a common issue. You need to practice more to improve your time management skills."
8.719470977783203
prompt:  Predict the next most probable utterance:
context:  [Teacher]: "That's a common issue. You need to practice more to improve your time management skills."
token:  [Student]: "Yes, I will do that. Also, I found some questions confusing. Can we go over them?"
15.029474258422852
prompt:  Predict the next most probable utterance:
context:  [Student]: "Yes, I will do that. Also, I found some questions confusing. Can we go over them?"
token:  [Teacher]: "Of course. Let's go through them."
5.871679782867432
Student : 11.503943602244059
Teacher : 7.266357898712158
['This is a conversation between Teacher and Student. ', '[Student]: "Miss, I need some 

7.869128227233887
prompt:  Predict the next most probable utterance:
context:  [Teacher]: "That sounds like a good plan. Make sure everyone gets a chance to contribute."
token:  [Student]: "Yes, sir. I will ensure that. Thank you for your support."
10.803418159484863
prompt:  Predict the next most probable utterance:
context:  [Student]: "Yes, sir. I will ensure that. Thank you for your support."
token:  [Teacher]: "You're welcome. Good luck with your study group."
8.914324760437012
Student : 15.957160631815592
Teacher : 7.978887875874837
['This is a conversation between Teacher and Student. ', '[Student]: "Miss, I\'m interested in getting involved in extracurricular activities. Can you suggest some opportunities?"', '[Teacher]: "Sure. What are your interests?"', '[Student]: "I\'m interested in sports, music, and community service. I believe these activities can help me develop my skills and broaden my horizons."', '[Teacher]: "That\'s true. You can join the school\'s sports teams, mus

9.101644515991211
prompt:  Predict the next most probable utterance:
context:  [Student]: "Thank you, sir. I believe it will be a positive change."
token:  [Teacher]: "You're welcome. I appreciate your initiative."
9.555538177490234
Student : 22.277028401692707
Teacher : 8.177759806315104
['This is a conversation between Teacher and Student. ', '[Student]: "Miss, I found the career development workshop very informative. I have some questions, though."', '[Teacher]: "Sure, go ahead."', '[Student]: "You mentioned the importance of internships. How can we find internships that align with our career goals?"', '[Teacher]: "You can start by researching companies in your field of interest. Look for internship opportunities on their websites or on job portals."', '[Student]: "Thank you, Miss. I will do that. Also, can you provide some tips on writing a good resume?"', '[Teacher]: "Of course. A good resume should be concise, well-organized, and tailored to the job you\'re applying for."']
promp

In [30]:
import pandas as pd

multisimo_df = pd.read_csv("../data/processed/multisimo_text.csv")
multisimo_df

Unnamed: 0,path,text
0,speech transcription_Transcriber/S05.trs,"[MOD] Ok hi welcome, thank you for coming toda..."
1,speech transcription_Transcriber/S17.trs,"[MOD] Hello guys, thanks very much for being h..."
2,speech transcription_Transcriber/S10.trs,[MOD] Ok. So I would like us to play a quiz. O...
3,speech transcription_Transcriber/S21.trs,[MOD] Ok so hello guys. Thanks very [S1] Hi. [...
4,speech transcription_Transcriber/S18.trs,[MOD] Ok hi guys Thanks very much for coming [...
5,speech transcription_Transcriber/S14.trs,[MOD] Hello guys thanks very much for coming h...
6,speech transcription_Transcriber/S19.trs,[MOD] Perfect. Well hi guys. Welcome. [S1] Hi....
7,speech transcription_Transcriber/S22.trs,[MOD] Ah it's fine. Hello guys. Thanks very mu...
8,speech transcription_Transcriber/S11.trs,"[MOD] Right. So, I would like us to play a qui..."
9,speech transcription_Transcriber/S20.trs,[MOD] So hello. Thanks very [S1] Hi. [MOD] muc...


In [31]:
import re

dominance_scores = {}

for el,path in zip(multisimo_df["text"], multisimo_df["path"]):
    print(path)
    dataset = re.sub(r'\[', r'\n[', el).split("\n")[1:]
    pattern = r'\[(S\d|MOD)\]'
    matches = re.findall(pattern, "".join(dataset))
    MOD_idxs = np.argwhere(np.asarray(matches) =='MOD').ravel()
    mod_idx = []
    for idx,(el, nxt_el) in enumerate(zip(MOD_idxs[:-1], MOD_idxs[1:])):
        mod_idx +=[el for idx in range(nxt_el - el)]
    mod_idx += [MOD_idxs[-1] for _ in range(len(dataset) - MOD_idxs[-1])]
    firstliner = ""
    dataset = [firstliner] + dataset
    assert len(mod_idx) == len(dataset[1:])
    prmt = "This is a conversation between users in parethesis ([S1], [S2], [MOD])\n Predict the next most probable utterance:"
    perpl = compute_perplexity(dataset, prmt, mod_idx=np.asarray(mod_idx))
    dominance_scores[path] = {}
    for patt in np.unique(matches):
        idx = np.asarray([index for index, element in enumerate(matches) if element == patt])
        dominance_scores[path][patt] = np.mean(np.asarray(perpl)[idx])
        print(f"{patt} :", np.mean(np.asarray(perpl)[idx]))

speech transcription_Transcriber/S05.trs
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  
token:  [MOD] Ok hi welcome, thank you for coming today. We're going to play a quiz. I would like to ask you three questions which were posed to a group of one hundred people and I would like you to guess the three most popular answers to these questions. 
17.746978759765625
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] Ok hi welcome, thank you for coming today. We're going to play a quiz. I would like to ask you three questions which were posed to a group of one hundred people and I would like you to guess the three most popular answers to these questions. 
token:  [S2] Ok. 
21.13665008544922
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:

24.186880111694336
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] Yeah. 
token:  [S1] Ok. 
4.780437469482422
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Ok. 
token:  [MOD] Right. So, the first think I would like you to name is a public place where you would be more likely to catch f the flu or a cold. 
39.64106750488281
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] Right. So, the first think I would like you to name is a public place where you would be more likely to catch f the flu or a cold. 
token:  [S1] hmm The the bus? 
113.41551208496094
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] hmm The the bus? 
token:  [S2] Yea

48.72734069824219
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] the 
token:  [MOD] what's the most popular answer? 
52.939998626708984
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] what's the most popular answer? 
token:  [S1] So it's eh So it's hospital, school and airplane. 
142.50291442871094
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] So it's eh So it's hospital, school and airplane. 
token:  [S2] mhmm 
19.463489532470703
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] mhmm 
token:  [S1] So Maybe school? 
83.89259338378906
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next 

14.541047096252441
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] yeah 
token:  [S1] one. 
17.82081413269043
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] one. 
token:  [S2] But at the same time like I think you you're more likely to travel when you're sick. I mean by by airplane because you know you already booked a plane and you know unless you've got insurance and you you're gonna cancel the flight 
39.83600997924805
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] But at the same time like I think you you're more likely to travel when you're sick. I mean by by airplane because you know you already booked a plane and you know unless you've got insurance and you you're gonna cancel the flight 
token:  [S1] hmm 
15.76

269.0171813964844
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] And would the top 
token:  [S1] hm I I then I would you know hospital before 
271.1746826171875
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] hm I I then I would you know hospital before 
token:  [S2] top would be 
28.301973342895508
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] top would be 
token:  [S1] airplane would in first would be schools yeah 
309.9883117675781
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] airplane would in first would be schools yeah 
token:  [S2] bef and school yeah yeah 
43.23312759399414
prompt:  This is a conversation between users

56.173561096191406
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] Nope. 
token:  [S2] No. 
20.83803367614746
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] No. 
token:  [MOD] It allows you to give the rhythm the melody as well. 
116.17231750488281
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] It allows you to give the rhythm the melody as well. 
token:  [S2] ok 
109.47976684570312
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] ok 
token:  [S1] hmm I guess so eh a drum? 
54.1176872253418
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] hmm

28.973188400268555
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] sort of so it wouldn't be as visible I'd say. 
token:  [MOD] So what would be your final decision? 
29.93851661682129
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] So what would be your final decision? 
token:  [S1] yeah 
76.59479522705078
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] yeah 
token:  [S2] yeah vi 
41.78853988647461
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] yeah vi 
token:  [S1] like ah violin 
125.1852798461914
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context: 

195.0156707763672
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] y 
token:  [S2] no 
80.55239868164062
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] no 
token:  [MOD] yeah good idea but it wasn't one of the popu lar answers ok 
142.7668914794922
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] yeah good idea but it wasn't one of the popu lar answers ok 
token:  [S1] a juat 
152.2194061279297
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] a juat 
token:  [S2] Hair? 
66.04971313476562
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] Hair? 
to

105.54261779785156
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Yeah but I think hair as well is I don't know eh i it's both with scissors so I don't know yeah many paper 
token:  [S2] cut hair 
19.84585952758789
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] cut hair 
token:  [S1] ah I don't know eh sorry 
35.16575241088867
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] ah I don't know eh sorry 
token:  [S2] paper I think I don't know you made me unsure again yeah I think I think you're right I think meat should probably be very close 
48.516273498535156
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] paper I think I don't kno

57.1881217956543
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] borate, you need to talk to each other and then you'll have to rank those answers. Ok? 
token:  [S1] Ok. 
16.575759887695312
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Ok. 
token:  [MOD] Are you ready or would you like an example or what do you feel? You're ready for the first question or 
42.08979034423828
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] Are you ready or would you like an example or what do you feel? You're ready for the first question or 
token:  [S2] Sure go yeah. 
162.3961639404297
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] Sure go yeah.

24.56195831298828
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] buses 
token:  [S2] or 
14.113424301147461
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] or 
token:  [S1] yeah 
31.060440063476562
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] yeah 
token:  [S2] yeah 
5.347904205322266
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] yeah 
token:  [S1] I'd say bu ses 
60.43922805786133
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] I'd say bu ses 
token:  [S2] yeah 
23.213293075561523
prompt:  This is a conversation between users in parethes

73.89102172851562
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] say would be pretty poular. 
token:  [S1] Yeah. 
12.632354736328125
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Yeah. 
token:  [S2] I don't know. 
3.658543348312378
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] I don't know. 
token:  [S1] Yeah I think that would be the most popular I'm not sure if 
20.884418487548828
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Yeah I think that would be the most popular I'm not sure if 
token:  [S2] yeah 
14.787836074829102
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most

59.0811653137207
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] Can you name an instrument you can find in a symphony orchestra. 
token:  [S1] Flute? 
22.5559024810791
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Flute? 
token:  [S2] Violin? Oh we want the three most common aswers 
49.23714828491211
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] Violin? Oh we want the three most common aswers 
token:  [MOD] mhmm 
81.12238311767578
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] mhmm 
token:  [S2] to that. ok. 
85.91227722167969
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next m

347.1676025390625
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] strings. 
token:  [S2] Ok, no strings. 
55.88539123535156
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] Ok, no strings. 
token:  [S1] No strings. Ok. Like something with percussion or? 
56.911598205566406
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] No strings. Ok. Like something with percussion or? 
token:  [MOD] Could be. 
37.2971076965332
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] Could be. 
token:  [S2] Timpani? or Maybe piano? But it's not they're not usually 
111.02336883544922
prompt:  This is a conversation between users in parethesis ([S1], [S2], 

72.02225494384766
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] You need to 
token:  [S2] Tuba? 
160.02427673339844
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] Tuba? 
token:  [MOD] come up with the last one. 
53.68950271606445
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] come up with the last one. 
token:  [S1] No? 
38.23398208618164
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] No? 
token:  [S2] Oh we need to come up with the last one. 
6.447992324829102
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] Oh we need to come up with th

14.195422172546387
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] Yeah. 
token:  [S1] Yes. 
4.998136520385742
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Yes. 
token:  [MOD] That's correct 
66.80220031738281
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] That's correct 
token:  [S1] ok well done guys. 
75.72529602050781
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] ok well done guys. 
token:  [MOD] So we have the third question which is the last one. 
32.564903259277344
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] So we have the th

55.69911193847656
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] bread 
token:  [S1] ra ah we don't will you confirm which are the correct ones? 
80.2726058959961
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] ra ah we don't will you confirm which are the correct ones? 
token:  [MOD] Which ones do you have now? 
25.604419708251953
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] Which ones do you have now? 
token:  [S1] So we have 
47.068695068359375
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] So we have 
token:  [S2] bread meat 
131.82470703125
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 P

34.87508010864258
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Alright. 
token:  [S2] Ok. 
5.4255452156066895
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] Ok. 
token:  [S1] piece of what 
48.063316345214844
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] piece of what 
token:  [S2] hm 
19.07562255859375
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] hm 
token:  [S1] Fabric? 
69.68670654296875
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Fabric? 
token:  [S2] ok cut So we see it everyday like 
201.4953155517578
prompt:  This is a conve

33.477603912353516
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Thank you . 
token:  [MOD] So that was it. I hope you enjoyed it. 
16.68807601928711
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] So that was it. I hope you enjoyed it. 
token:  [S1] Yes. 
15.044355392456055
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Yes. 
token:  [S2] Yeah. 
5.793904781341553
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] Yeah. 
token:  [MOD] Thanks for coming again. 
54.24306869506836
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] Thanks for coming

34.03059387207031
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Yeah. 
token:  [MOD] Can you give 
94.77132415771484
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] Can you give 
token:  [S1] ah 
177.69650268554688
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] ah 
token:  [MOD] a specific examples? 
326.881103515625
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] a specific examples? 
token:  [S1] I'd guess a 
67.12316131591797
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] I'd guess a 
token:  [S2] bus it ten 
175.3490447998047
prompt: 

143.1768798828125
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Hospital I would have so hospi 
token:  [MOD] mhmm 
160.15786743164062
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] mhmm 
token:  [S1] tal first yeah. probably then school cause I wouldn't immediately jump to public transport 
424.8908386230469
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] tal first yeah. probably then school cause I wouldn't immediately jump to public transport 
token:  [S2] Yeah ha. 
41.50859832763672
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] Yeah ha. 
token:  [S1] Yeah. 
6.308543682098389
prompt:  This is a conversation between users in

51.15168380737305
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] s I'd say w would be like some sort of like a flute 
token:  [S2] The flute? 
9.540661811828613
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] The flute? 
token:  [S1] yeah 
21.661882400512695
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] yeah 
token:  [MOD] hmm Not really 
112.3855972290039
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] hmm Not really 
token:  [S2] Is it a wind instrument? 
51.45106506347656
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] Is it a wind instr

7.964885234832764
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] yeah 
token:  [S2] it see ms reasonable. 
162.03762817382812
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] it see ms reasonable. 
token:  [MOD] Well done 
184.70289611816406
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] Well done 
token:  [S1] yeah 
58.649410247802734
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] yeah 
token:  [MOD] that's it you found it. 
53.33615493774414
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] that's it you found it. 
token:  [S2] Well 
91.531

24.780399322509766
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Yeah that's good. 
token:  [MOD] yes. 
42.43696975708008
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] yes. 
token:  [S2] So it's two. 
38.928680419921875
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] So it's two. 
token:  [MOD] mhmm So one more. 
51.223819732666016
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] mhmm So one more. 
token:  [S1] It's not another food item 
67.88472747802734
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] It's not another food item 
token:  

87.13555145263672
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] yeah 
token:  [MOD] Now you didn't get this one ri ght it was the hair first paper second and meat came third. 
189.58189392089844
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] Now you didn't get this one ri ght it was the hair first paper second and meat came third. 
token:  [S1] Ok. 
26.048046112060547
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Ok. 
token:  [MOD] If you think about the most frequently used phrase you you know most people say have a haircut right? It's a very frequently used word combination. I'm going to have a haircut and 
39.06939697265625
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict 

55.56281661987305
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] it's a 
token:  [S2] decide which are the populars eh? 
193.6833038330078
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] decide which are the populars eh? 
token:  [S1] Yeah. 
15.434473037719727
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Yeah. 
token:  [S2] More. 
15.61414623260498
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] More. 
token:  [MOD] th think about there's something connected to the airport 
326.88018798828125
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD

27.92127227783203
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] Yeah. 
token:  [S1] If you got a child. 
30.61693000793457
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] If you got a child. 
token:  [MOD] So it's the school. 
47.015079498291016
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] So it's the school. 
token:  [S1] School ok. 
57.36444091796875
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] School ok. 
token:  [MOD] Yeah. That's great guys, so you have the three answ ers. 
71.82865142822266
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
conte

26.940719604492188
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] Very good. Ready for the second one? 
token:  [S2] mhmm 
37.116737365722656
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] mhmm 
token:  [MOD] Yeah? 
86.58048248291016
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] Yeah? 
token:  [S1] Ok. 
14.51305103302002
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Ok. 
token:  [MOD] Can you name an instrument you can find in a symphony orchestra. 
38.42345428466797
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] Can you name an instr

21.90727424621582
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] Hit it? 
token:  [MOD] Yeah. 
48.06699752807617
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] Yeah. 
token:  [S2] Yes. So drums 
179.32220458984375
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] Yes. So drums 
token:  [S1] Drums? 
10.237733840942383
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Drums? 
token:  [MOD] Drums yeah very good. 
57.22486114501953
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] Drums yeah very good. 
token:  [S2] hm hmm hm 
32.54014587402344
promp

55.81010818481445
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Well, I I support your point that that drums are always in the back 
token:  [S2] yes 
11.755651473999023
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] yes 
token:  [S1] I think that makes a sense to put even the third place 
55.51790237426758
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] I think that makes a sense to put even the third place 
token:  [S2] The third place. 
10.456238746643066
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] The third place. 
token:  [S1] Makes a sense to me. 
14.024653434753418
prompt:  This is a conversation between users in paret

13.699899673461914
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] hm 
token:  [S1] cut the paper 
28.66712760925293
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] cut the paper 
token:  [MOD] Paper is right actually. 
179.8455810546875
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] Paper is right actually. 
token:  [S1] or cut the crap if it's something else 
62.92634201049805
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] or cut the crap if it's something else 
token:  [MOD] m no we need something more tangible 
192.2998046875
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next mos

13.166196823120117
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] I'm not a vegetarian. 
token:  [S2] So you well meat hair and eh pa 
590.8807373046875
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] So you well meat hair and eh pa 
token:  [S1] paper 
41.90790939331055
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] paper 
token:  [S2] per 
53.22109603881836
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] per 
token:  [S1] Oh in this digital world you don't cut the paper so much. 
52.30253219604492
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  

89.59741973876953
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] ch to discuss if you have d if you disagree with. 
token:  [S2] Ah oh no. No, I think then we can go for meat , hair and then paper. 
64.7562026977539
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] Ah oh no. No, I think then we can go for meat , hair and then paper. 
token:  [S1] Ok. Ok. Works for me. 
10.238398551940918
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Ok. Ok. Works for me. 
token:  [MOD] Yeah? 
35.444034576416016
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] Yeah? 
token:  [S1] No? 
15.189308166503906
prompt:  This is a conversation between users 

89.93805694580078
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] We think yeah 
token:  [S2] We think yeah 
5.3654656410217285
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] We think yeah 
token:  [MOD] Yeah? 
59.97245788574219
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] Yeah? 
token:  [S2] Yeah go ahead. 
28.297452926635742
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] Yeah go ahead. 
token:  [MOD] Can you name a public place where it's likely to catch a cold or a flu bug. 
45.53079605102539
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  

105.53195190429688
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] hmm ok So the airplane. air 
token:  [S1] airplane yeah 
40.881832122802734
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] airplane yeah 
token:  [MOD] You agree? 
83.876708984375
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] You agree? 
token:  [S1] yeah 
62.4335823059082
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] yeah 
token:  [S2] yeah 
4.482073783874512
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] yeah 
token:  [MOD] So you have eh plane 
400.4423828125
prompt:  

21.92849349975586
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] hospital 
token:  [S1] hmm 
18.114465713500977
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] hmm 
token:  [S2] eh 
11.237034797668457
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] eh 
token:  [MOD] and third is 
235.5081024169922
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] and third is 
token:  [S2] ok 
141.2379608154297
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] ok 
token:  [MOD] plane 
341.4992370605469
prompt:  This is a conversation between users in parethesis (

154.89190673828125
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] You agree both of you? 
token:  [S2] yeah yeah 
104.90445709228516
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] yeah yeah 
token:  [S1] hmm 
8.355359077453613
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] hmm 
token:  [S2] yeah it can be the drum 
45.90712356567383
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] yeah it can be the drum 
token:  [MOD] yeah it's the drum, well done! And can you order now the answers please? 
72.2256088256836
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:


30.420289993286133
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] so 
token:  [S2] yeah I mean I mean I mean the bread seems ok I mean I 
45.325096130371094
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] yeah I mean I mean I mean the bread seems ok I mean I 
token:  [S1] ok let's go for bread first so bread first 
36.033905029296875
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] ok let's go for bread first so bread first 
token:  [S2] do you think we should opt for for another food eh than cheese 
54.21983337402344
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] do you think we should opt for for another food eh than cheese 
toke

149.59286499023438
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] Think of something that both men and women cut. maybe men more often 
token:  [S2] ah smoking is for certain f f smoking is 
326.0688171386719
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] ah smoking is for certain f f smoking is 
token:  [MOD] hmm 
80.86455535888672
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] hmm 
token:  [S2] one thing eh if we if we'd use it metaphorically though but 
191.51730346679688
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] one thing eh if we if we'd use it metaphorically though but 
token:  [MOD] It has to do with appearance. 
4

287.27911376953125
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] meat meat 
token:  [S1] ok 
19.954315185546875
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] ok 
token:  [MOD] then 
71.5307388305664
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] then 
token:  [S2] hmm 
60.17437744140625
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] hmm 
token:  [MOD] there is one more left. 
56.183685302734375
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] there is one more left. 
token:  [S2] o k 
126.91854095458984
prompt:  This is a conversation be

58.20984649658203
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] and then meat and then no paper meat 
token:  [S1] ok we'll go with that yeah 
24.97891616821289
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] ok we'll go with that yeah 
token:  [S2] hair pa per meat 
402.6614074707031
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] hair pa per meat 
token:  [S1] hair paper meat 
47.26845169067383
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] hair paper meat 
token:  [MOD] you're sure? 
71.9852066040039
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
conte

172.93643188476562
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Oh yeah ri ah ok 
token:  [S2] Yeah. 
9.22781753540039
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] Yeah. 
token:  [S1] Ok so 
27.930130004882812
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Ok so 
token:  [S2] A bus maybe, public transportation bus a bus 
117.9043960571289
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] A bus maybe, public transportation bus a bus 
token:  [S1] Yeah, something that has like the you know the air conditioning? 
36.38888168334961
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next mos

7.926351547241211
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] yeah 
token:  [MOD] You already found two. 
104.22848510742188
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] You already found two. 
token:  [S1] Ok, plane bus? 
171.52886962890625
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Ok, plane bus? 
token:  [MOD] You have plane hospital 
297.9273986816406
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] You have plane hospital 
token:  [S1] Oh hospit 
116.64512634277344
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Oh hospit 
tok

33.51115036010742
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] a school 
token:  [S2] school and then 
21.79804039001465
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] school and then 
token:  [S1] hospital, plane hm 
101.62501525878906
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] hospital, plane hm 
token:  [S2] hospital you're not supposed to get cold 
28.004362106323242
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] hospital you're not supposed to get cold 
token:  [S1] yeah we're just surrounded with sick people ah yeah so 
66.13534545898438
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])


23.18852996826172
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Violin yeah. 
token:  [S2] do you think? 
14.991884231567383
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] do you think? 
token:  [S1] 
7.911811828613281
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] 
token:  [S2] So gui Flute? f floute flu te? 
449.9436340332031
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] So gui Flute? f floute flu te? 
token:  [S1] Flute yeah. 
18.056333541870117
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Flute yeah. 
token:  [S2] le let's first sa

52.1905403137207
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Then cello, drum? 
token:  [S2] mhmm 
19.340431213378906
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] mhmm 
token:  [MOD] That's correct yeah, well done! That's brilliant. 
64.50267028808594
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] That's correct yeah, well done! That's brilliant. 
token:  [S1] I just know what's the most obscure so I go for the last one ok. 
39.23000717163086
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] I just know what's the most obscure so I go for the last one ok. 
token:  [MOD] Perfect. Are you ready for the third question? 
26.02283

78.82054901123047
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] rope 
token:  [S1] Cut paper? 
52.87858963012695
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Cut paper? 
token:  [S2] mhmm 
13.369482040405273
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] mhmm 
token:  [MOD] of course paper 
274.2367248535156
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] of course paper 
token:  [S2] yes you're right. 
37.106101989746094
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] yes you're right. 
token:  [S1] paper cut 
48.246864318847656
prompt:

22.770164489746094
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] ok 
token:  [S2] But I'm not 
16.386554718017578
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] But I'm not 
token:  [S1] yeah 
21.03838348388672
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] yeah 
token:  [S2] hundred per cent sure. 
34.34004211425781
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] hundred per cent sure. 
token:  [S1] Yeah me 
52.87065887451172
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Yeah me 
token:  [S2] so we have hair, paper 
86.27613067626953
pro

37.67164611816406
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] important decision so I think 
token:  [S1] It is it is ok so meat 
76.00321960449219
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] It is it is ok so meat 
token:  [S2] e e 
26.548921585083008
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] e e 
token:  [S1] first 
24.357419967651367
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] first 
token:  [S2] meat, hair and paper 
72.68701934814453
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] meat, hair and paper 
token:  [S1] Meat, 

58.85484313964844
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] ok. 
token:  [MOD] Is it clear? Ye 
191.41432189941406
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] Is it clear? Ye 
token:  [S1] Yep. 
57.41337203979492
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Yep. 
token:  [MOD] ah. 
80.26112365722656
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] ah. 
token:  [S2] Yes yeah. 
48.50630569458008
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] Yes yeah. 
token:  [MOD] ok 
164.3433380126953
prompt:  This is a conversation between user

167.98306274414062
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] hmm think of f different age groups. 
token:  [S2] Different age groups as 
66.59906005859375
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] Different age groups as 
token:  [MOD] Think about 
125.22139739990234
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] Think about 
token:  [S2] in 
36.22412872314453
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] in 
token:  [MOD] ch children for example. 
406.5423278808594
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] ch children f

74.28202056884766
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] The second one is hospital and the third is the plane. So you just missed 
token:  [S2] ok. 
84.4184341430664
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] ok. 
token:  [MOD] the first two but 
167.33168029785156
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] the first two but 
token:  [S1] Yeah. 
68.21853637695312
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Yeah. 
token:  [MOD] Yeah. 
18.43769073486328
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] Yeah. 
token:  [S2]

501.3931579589844
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] and th there's eh well one of those eh trumpet a trumpet eh eh cla 
token:  [S1] Clarinet. 
62.206398010253906
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Clarinet. 
token:  [S2] arinet clari 
97.63428497314453
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] arinet clari 
token:  [MOD] No 
142.64065551757812
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] No 
token:  [S2] net 
138.57177734375
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] net 
token:  [S1] No. 
16.643024444

158.74769592285156
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] ly yeah Drum i 
token:  [S2] ah is more like for a rock band. 
39.97986602783203
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] ah is more like for a rock band. 
token:  [S1] Yeah 
15.227802276611328
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Yeah 
token:  [S2] You know like you don't this is not the first thing that comes to mind with a symphony orchestra. 
17.776859283447266
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] You know like you don't this is not the first thing that comes to mind with a symphony orchestra. 
token:  [S1] So we've violin cello and d

53.06706237792969
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] It could be. 
token:  [S2] or when y 
228.9556884765625
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] or when y 
token:  [MOD] It could 
408.6750793457031
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] It could 
token:  [S2] you're shaving. When you 
95.26500701904297
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] you're shaving. When you 
token:  [S1] Like an injury yeah. 
95.48516845703125
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Like an injury yeah. 
token:  [S2] 

96.23682403564453
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] m the most way yeah 
token:  [S2] So is is a gain it's hai 
109.33958435058594
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] So is is a gain it's hai 
token:  [S1] in 
27.311279296875
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] in 
token:  [S2] air 
38.894065856933594
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] air 
token:  [MOD] Meat 
357.3693542480469
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] Meat 
token:  [S2] eh me 
228.08546447753906
prompt:  This is a conve

84.4993896484375
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] No I'm Then what's the second one? 
token:  [S2] I don't know like the first one no the first c is paper. 
55.05736541748047
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] I don't know like the first one no the first c is paper. 
token:  [MOD] It's pape 
126.08238220214844
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] It's pape 
token:  [S2] The 
69.95323944091797
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] The 
token:  [MOD] r. 
300.6296691894531
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable ut

27.458276748657227
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Yeah. 
token:  [S2] Yeah. 
4.207853317260742
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] Yeah. 
token:  [MOD] Ready to start? 
32.9071044921875
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] Ready to start? 
token:  [S1] Yeah. 
19.238344192504883
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Yeah. 
token:  [MOD] Yeah. 
18.43769073486328
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] Yeah. 
token:  [S2] Yeah. 
13.424955368041992
prompt:  This is a conversation between u

309.600830078125
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] p three? Ok. Oh we're doing fairly 
token:  [S1] Awh good. 
38.74245834350586
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Awh good. 
token:  [MOD]  doing grea So nice. 
301.5030822753906
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD]  doing grea So nice. 
token:  [MOD] doing well. 
43.1670036315918
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] doing well. 
token:  [S2] t. Yeah. 
77.97394561767578
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] t. Yeah. 
token:  [S1] Somew

325.7045593261719
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] So hos 
token:  [S1] Yeah. 
65.1232681274414
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Yeah. 
token:  [MOD] pital first then? 
478.66522216796875
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] pital first then? 
token:  [S2] Yeah. 
47.10780334472656
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] Yeah. 
token:  [S1] Then 
14.148193359375
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Then 
token:  [S2] Then 
4.075507640838623
prompt:  This is a conversation between user

269.23199462890625
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] And is a sym phony. 
token:  [MOD] For the la st one. 
147.202880859375
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] For the la st one. 
token:  [S2] I'm trying to think what's probably the most What jumps out when you think symphony orchestra? 
65.76708984375
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] I'm trying to think what's probably the most What jumps out when you think symphony orchestra? 
token:  [S1] Y your 
82.14413452148438
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Y your 
token:  [S2] Y yes. 
9.991506576538086
prompt:  This is a conversatio

8.243498802185059
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Yeah. 
token:  [S2] Yeah? And then what? The drums wa 
144.26309204101562
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] Yeah? And then what? The drums wa 
token:  [S1] And then drums. 
31.420196533203125
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] And then drums. 
token:  [S2] s the third one we had. 
41.75739669799805
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] s the third one we had. 
token:  [S1] Yeah. 
8.116808891296387
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1

130.5613555908203
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] The opposite of ve getable? 
token:  [MOD] If you're a vegetarian like think of what you would 
89.43244171142578
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] If you're a vegetarian like think of what you would 
token:  [S1] Meat? 
44.83694076538086
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Meat? 
token:  [MOD] Meat. Yeah. 
56.470428466796875
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] Meat. Yeah. 
token:  [S2] Ok. 
24.80381202697754
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance

30.342357635498047
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] But every time we've 
token:  [S1] s paper either? 
143.93678283691406
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] s paper either? 
token:  [S2] Yeah. I'd say meat paper, hair maybe? 
92.42871856689453
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] Yeah. I'd say meat paper, hair maybe? 
token:  [S1] Meat, paper, hair? 
6.344846725463867
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Meat, paper, hair? 
token:  [S2] We've been wrong with the order every time so far so 
40.42560577392578
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MO

18.56334686279297
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Ok. 
token:  [S2] Ok. 
3.769420623779297
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] Ok. 
token:  [MOD] Are you ready for the first question? 
17.934473037719727
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] Are you ready for the first question? 
token:  [S1] Yeah. 
19.63398551940918
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Yeah. 
token:  [MOD] Ok. 
23.830276489257812
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] Ok. 
token:  [S2] Ok. 
14.052390098571777
prompt: 

91.93988037109375
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] yes 
token:  [S1] where with bad ventilation like in the theatre in 
264.9595031738281
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] where with bad ventilation like in the theatre in 
token:  [MOD] If you stick to the means of transport you me 
124.2529067993164
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] If you stick to the means of transport you me 
token:  [S1] ok 
90.44139862060547
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] ok 
token:  [MOD] ntion some more. 
347.2777404785156
prompt:  This is a conversation between users in parethesis ([S1], [S2], [M

15.526985168457031
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] makes sense. 
token:  [MOD] exactly. 
77.81526947021484
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] exactly. 
token:  [S1] yeah 
116.24861907958984
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] yeah 
token:  [MOD] So you have the three, alright? Schools 
218.51187133789062
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] So you have the three, alright? Schools 
token:  [S1] mhmm 
41.92586898803711
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] mhmm 
token:  [MOD] hospita

198.11155700683594
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] rst answer 
token:  [S2] hmm 
55.788902282714844
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] hmm 
token:  [MOD] right? Hospital is number two airplane is number three 
216.8293914794922
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] right? Hospital is number two airplane is number three 
token:  [S1] Ok. 
44.910369873046875
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Ok. 
token:  [MOD] you you were right about airplanes. 
186.89830017089844
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utter

30.985227584838867
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Ok. 
token:  [MOD] the drum. So what would be the right order then in terms of popularity. 
84.21904754638672
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] the drum. So what would be the right order then in terms of popularity. 
token:  [S1] Oh v v v Violin o pro probably the first. and drum I think drum would be the the last. 
134.65367126464844
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Oh v v v Violin o pro probably the first. and drum I think drum would be the the last. 
token:  [S2] So sorry what was the second one? 
16.49104118347168
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probab

61.868133544921875
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] the I mean it's not the literal meaning 
token:  [MOD] Let's think about the literal meaning of 
26.982080459594727
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] Let's think about the literal meaning of 
token:  [S2] yeah 
280.8720703125
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] yeah 
token:  [MOD] the wo rd 
173.637939453125
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] the wo rd 
token:  [S2] hmm 
131.3003692626953
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] hm

86.4261703491211
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] Excellent, yes yes. 
token:  [S1] mhmm 
37.52107238769531
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] mhmm 
token:  [MOD] So you need one more. 
68.47508239746094
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] So you need one more. 
token:  [S1] Meat, hair and cu t Paper? 
429.0921936035156
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Meat, hair and cu t Paper? 
token:  [MOD] Very good so you have the 
122.66029357910156
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] V

37.44369125366211
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] Ok. 
token:  [MOD] Is it clear? 
39.235721588134766
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] Is it clear? 
token:  [S1] Yeah. 
20.525400161743164
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Yeah. 
token:  [MOD] Are you ready 
69.02218627929688
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] Are you ready 
token:  [S2] Yeah. 
47.60600280761719
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] Yeah. 
token:  [MOD] for the first question? 
81.02925872802734
prompt:  This 

69.23469543457031
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] So 
token:  [S2] so we need one more? 
56.9674186706543
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] so we need one more? 
token:  [MOD] one more and it's you mentioned public transpo rt 
229.5259552001953
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] one more and it's you mentioned public transpo rt 
token:  [S1] Hmm we mentioned public tran sport, work? No. 
149.22802734375
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Hmm we mentioned public tran sport, work? No. 
token:  [MOD] It it's it's about public trans port. 
79.71452331542969
prompt:  This is a con

16.672386169433594
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Most popular. 
token:  [S2] Think hospital might be most popular. 
53.5261344909668
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] Think hospital might be most popular. 
token:  [S1] Ok. 
11.730086326599121
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Ok. 
token:  [S2] What do you think? 
4.730863094329834
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] What do you think? 
token:  [S1] I'll go with that cause there's I don't know, I just think it's safe safe enough. Should be safe to be in a hospital 
31.625980377197266
prompt:  This is a conversation between use

46.27540969848633
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] Ah but still ah that's good. Are you ready for the second one? 
token:  [S2] Sure. 
17.1470947265625
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] Sure. 
token:  [S1] Yeah. 
6.353737831115723
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Yeah. 
token:  [MOD] Name an instrument you can find in a symphony orchestra. 
39.60953140258789
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] Name an instrument you can find in a symphony orchestra. 
token:  [S1] Violin? 
36.119873046875
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict 

85.73981475830078
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] drums are definitely at the back so. 
token:  [S2] And violin should be number one. 
24.095979690551758
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] And violin should be number one. 
token:  [S1] Probably. 
11.437103271484375
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Probably. 
token:  [S2] I think so. 
4.3493804931640625
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] I think so. 
token:  [MOD] So what do you think? 
11.331825256347656
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
c

34.780033111572266
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] grass? 
token:  [S2] Tape? 
17.425617218017578
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] Tape? 
token:  [S1] Tape. 
10.225043296813965
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Tape. 
token:  [S2] 
8.150042533874512
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] 
token:  [S1] Cut. 
22.6580753326416
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Cut. 
token:  [S2] Hair? 
5.114971160888672
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD]

123.76282501220703
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] No. The first one is hair. The most po 
token:  [S2] Oh! 
128.31686401367188
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] Oh! 
token:  [MOD] pular answer was eh was hair 
2295.2890625
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] pular answer was eh was hair 
token:  [S1] Cut my 
145.76275634765625
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Cut my 
token:  [MOD] actually. 
439.77960205078125
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] actually. 
token:  [S1] hai

96.61334991455078
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD]: I'll give you 
token:  [S2]: answers 
209.04347229003906
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2]: answers 
token:  [MOD]: No, I'll give you the question 
45.9296989440918
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD]: No, I'll give you the question 
token:  [S2]: yeah 
61.41923141479492
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2]: yeah 
token:  [MOD]: you'll come up with answers 
60.725563049316406
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD]: you'll come up 

23.886247634887695
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1]: se 
token:  [S2]: public transport like train station 
86.78296661376953
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2]: public transport like train station 
token:  [S1]: yeah public transport train station ah station or airport or something like 
49.09475326538086
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1]: yeah public transport train station ah station or airport or something like 
token:  [S2]: yeah 
9.081487655639648
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2]: yeah 
token:  [S1]: that yeah and the third is hmm 
55.38738250732422
prompt:  This is a co

34.99715805053711
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1]: first one yeah 
token:  [S2]: what you 
21.989633560180664
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2]: what you 
token:  [S1]: Yeah it's first for me. 
37.12928009033203
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1]: Yeah it's first for me. 
token:  [S2]: yeah 
7.472891330718994
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2]: yeah 
token:  [S1]: and then the 
26.18282699584961
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1]: and then the 
token:  [S2]: airport 
5.8242835

177.90625
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD]: eh you n you need to name an instrument where you 
token:  [S1]: uhmh 
67.1258544921875
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1]: uhmh 
token:  [MOD]: find in a symphony orchestra. 
147.87240600585938
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD]: find in a symphony orchestra. 
token:  [S1]: symphony orchestra 
17.2187557220459
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1]: symphony orchestra 
token:  [MOD]: Yeah like a big orchestra 
97.31929016113281
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable

7.809695720672607
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1]: no 
token:  [MOD]: unfortunately not 
130.0292205810547
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD]: unfortunately not 
token:  [S1]: ahm there are different types of 
53.371559143066406
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1]: ahm there are different types of 
token:  [MOD]: yeah 
213.56295776367188
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD]: yeah 
token:  [S1]: violin 
119.66150665283203
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1]: violin 
token:  [MOD]:

45.05738830566406
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD]: The last one is cello. 
token:  [S2]: Sorry? 
37.437522888183594
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2]: Sorry? 
token:  [MOD]: Cello? 
86.51217651367188
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD]: Cello? 
token:  [S2]: No idea what it 
78.63078308105469
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2]: No idea what it 
token:  [MOD]: No? 
86.7461929321289
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD]: No? 
token:  [S2]: is 
107.752685546875
prompt:  This is a 

36.97849655151367
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2]: Violin would be my first. How about you? 
token:  [S1]: yeah violin and the second is uhm 
53.98653793334961
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1]: yeah violin and the second is uhm 
token:  [S2]: drum 
23.0399169921875
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2]: drum 
token:  [S1]: drum 
9.447959899902344
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1]: drum 
token:  [S2]: or 
17.565170288085938
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2]: or 
token:  [S1]: a

149.9731903076172
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD]: Men maybe more often than women. 
token:  [S1]: oh 
57.79952621459961
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1]: oh 
token:  [MOD]: 
87.11236572265625
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD]: 
token:  [S2]: Hair? 
151.97825622558594
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2]: Hair? 
token:  [S1]: oh yeah 
18.321969985961914
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1]: oh yeah 
token:  [MOD]: Hair yeah. Very good. 
227.88131713867188
prompt:  This is a co

48.34941864013672
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2]: meat 
token:  [S1]: First I think we can so meat and the hair and then the 
1.922260046005249
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1]: First I think we can so meat and the hair and then the 
token:  [S2]: I forgot the other one 
18.58399772644043
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2]: I forgot the other one 
token:  [S1]: paper 
8.838641166687012
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1]: paper 
token:  [MOD]: Are you sure? 
37.60601043701172
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most

30.027114868164062
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] Yeah? 
token:  [S1] mhmm 
29.386281967163086
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] mhmm 
token:  [MOD] So are you ready for the first question? 
28.951066970825195
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] So are you ready for the first question? 
token:  [S2] Yeah. 
26.360923767089844
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] Yeah. 
token:  [S1] I'm ok 
19.072599411010742
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] I'm ok 
token:  [MOD] I would lite 

25.536638259887695
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] yeah 
token:  [S2] ah patients are ah certain times but it ah I don't know how to explain like it's eh it's supposed to be ah not contami not contaminated but in fact it is, because when patients are waiting for doctors they all ah transmitting their sickness to each other I think so 
70.82080841064453
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] ah patients are ah certain times but it ah I don't know how to explain like it's eh it's supposed to be ah not contami not contaminated but in fact it is, because when patients are waiting for doctors they all ah transmitting their sickness to each other I think so 
token:  [S1] ok So, yes I think in the hospital you would have the strongest disease that you could get because I think that from all 

67.40914154052734
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] I like your conver sation skills, I like the way you're trying to reach an agreement right 
token:  [S2] but because it's all 
60.75956726074219
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] but because it's all 
token:  [MOD] hmm 
181.0186767578125
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] hmm 
token:  [S2] it's also suits me so yeah it's just a good game 
70.19947052001953
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] it's also suits me so yeah it's just a good game 
token:  [S1] yeah because both make sense 
30.33434295654297
prompt:  This is a conversa

182.42349243164062
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] hmm 
token:  [S2] oh 
50.434478759765625
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] oh 
token:  [MOD] hmm 
62.18169403076172
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] hmm 
token:  [S2] no there no piano ah trum no yes or I don't have the english word for 
186.04222106933594
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] no there no piano ah trum no yes or I don't have the english word for 
token:  [S1] But which one is it, in what langua 
68.35057067871094
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next 

271.1465148925781
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] triangle 
token:  [S1] Oh that's amazing. That's an amazing answer. 
15.851935386657715
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Oh that's amazing. That's an amazing answer. 
token:  [S2] 
12.001670837402344
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] 
token:  [MOD] In Christmas carols yes. 
269.53216552734375
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] In Christmas carols yes. 
token:  [S1] yes yeah 
96.04647064208984
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S

52.6873664855957
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Oh! 
token:  [MOD] you got it right. 
35.477752685546875
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] you got it right. 
token:  [S1] Yay! 
18.237825393676758
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Yay! 
token:  [MOD] Ok so you have one more that ll third an final question, I would like you to name something that people cut. 
129.54489135742188
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] Ok so you have one more that ll third an final question, I would like you to name something that people cut. 
token:  [S2] Don't really 
49.8510627746582
prompt:  Thi

10.85559368133545
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] yeah 
token:  [S1] but most people anyway get it already sliced so I don't 
64.29395294189453
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] but most people anyway get it already sliced so I don't 
token:  [MOD] ok 
218.39768981933594
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] ok 
token:  [S1] think that 
53.56752395629883
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] think that 
token:  [MOD] hm hm 
69.34085083007812
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] hm h

27.448772430419922
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] So what would be the ranking in terms of popularity? What would you think? 
token:  [S2] Paper first. 
114.37258911132812
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] Paper first. 
token:  [S1] Yeah. 
8.317042350769043
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Yeah. 
token:  [MOD] hmm 
79.48519134521484
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] hmm 
token:  [S2] Hair second and then meat. I would say this. 
149.69833374023438
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
con

57.75456619262695
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Thanks. 
token:  [MOD] so we're going to play a quiz. I'm going to ask you three questions regarding the most ah popular questions about something that people were asked and so you're going to tell me ah the three most popular answers and then you will discuss with each other and you're going to put these answers into the correct rank in terms of popularity, for example if I ask you what do people use in order to transfer a patient your answers would be an ambulance a wheelchair or a hospital bed. And then I would ask you to put these ah answers into the correct ah order. Is everything 
27.891950607299805
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] so we're going to play a quiz. I'm going to ask you three questions regarding the most ah po

104.41233825683594
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] A place it could be something more v for example soemthing that people use to commute or a means of transportation 
token:  [S2] yeah transport yeah the bus and 
221.98533630371094
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] yeah transport yeah the bus and 
token:  [S1] oh yeah the bus Not yet? 
25.7852725982666
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] oh yeah the bus Not yet? 
token:  [MOD] Something else. 
58.34845733642578
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] Something else. 
token:  [S1] Airplanes, air 
159.79940795898438
prompt:  This is 

8.371320724487305
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] maybe 
token:  [S2] they get cold 
44.4827880859375
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] they get cold 
token:  [S1] yeah 
11.058295249938965
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] yeah 
token:  [S2] easily 
21.075273513793945
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] easily 
token:  [S1] School would be first one. 
55.96881103515625
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] School would be first one. 
token:  [S2] mhmm 
24.123462677001953
prompt: 

111.57642364501953
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Violin 
token:  [MOD] I need the th 
208.94131469726562
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] I need the th 
token:  [S2] Yeah violin. 
484.5538024902344
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] Yeah violin. 
token:  [S1] 
19.224666595458984
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] 
token:  [MOD] Perfect. 
100.15423583984375
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] Perfect. 
token:  [S2] I don't know how to say it in English. 
10.386302947998047


18.677627563476562
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] with strings 
token:  [MOD] Not bass 
1810.7965087890625
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] Not bass 
token:  [S1] sss 
64.89066314697266
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] sss 
token:  [MOD] 
54.22110366821289
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] 
token:  [S1] strings or oh guitars 
925.4987182617188
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] strings or oh guitars 
token:  [S2] I don't know. Harp. 
18.359193801879883
prompt:  This is 

24.742551803588867
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] hmm 
token:  [S2] that yeah 
24.071041107177734
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] that yeah 
token:  [MOD] ok 
136.99517822265625
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] ok 
token:  [S2] Yeah I know 
45.64357376098633
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] Yeah I know 
token:  [MOD] ok 
126.51243591308594
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] ok 
token:  [S2] yeah 
53.02497482299805
prompt:  This is a conversation between users in paret

358.9715270996094
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] Ah yeah I why isn't the piano 
token:  [S1] No piano. 
46.70490264892578
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] No piano. 
token:  [MOD] among these it's it's 
195.827392578125
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] among these it's it's 
token:  [S2] No no there no piano. 
219.73196411132812
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] No no there no piano. 
token:  [MOD] crazy eh but no, not piano 
250.2630157470703
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
contex

221.04229736328125
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] Battery? 
token:  [S1] Battery I understand drums 
431.7166748046875
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Battery I understand drums 
token:  [S2] but there 
58.99347686767578
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] but there 
token:  [S1] drums sorry 
191.90728759765625
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] drums sorry 
token:  [MOD] Yes. 
56.52495574951172
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] Yes. 
token:  [S1] Drums drums. 
52.1059341

59.77663040161133
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] struggling so much 
token:  [S2] yeah 
13.203441619873047
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] yeah 
token:  [S1] to find so yes 
64.40773010253906
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] to find so yes 
token:  [MOD] That's grat thank you yeah you're great. That's the correct order of course. 
102.76034545898438
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] That's grat thank you yeah you're great. That's the correct order of course. 
token:  [S1] Oh good. 
21.839326858520508
prompt:  This is a conversation between users in parethesis ([S1], [S2]

101.72232055664062
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] Something more specific? 
token:  [S2] Tomato 
298.8824462890625
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] Tomato 
token:  [S1] eh eh meat 
119.68867492675781
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] eh eh meat 
token:  [MOD] Yes! 
89.92656707763672
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] Yes! 
token:  [S2] ah 
165.97320556640625
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] ah 
token:  [MOD] Yes 
128.38735961914062
prompt:  This is a conversation betwee

138.79290771484375
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] delighted to say you made it 
token:  [S1] wow, we're amazing! 
31.74407958984375
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] wow, we're amazing! 
token:  [MOD] three out of three you're fantastic! Thank you thank you so much so yeah that's the end, I hope you enjoyed that. Thank you very much, you're great. Good job 
25.43142318725586
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] three out of three you're fantastic! Thank you thank you so much so yeah that's the end, I hope you enjoyed that. Thank you very much, you're great. Good job 
token:  [S1] Thank you . That's it was 
42.27044677734375
prompt:  This is a conversation between users in paret

152.3042755126953
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] eh 
token:  [MOD] and 
104.35092163085938
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] and 
token:  [S1] toge eh the people get cold in it? 
316.79852294921875
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] toge eh the people get cold in it? 
token:  [MOD] yes 
120.97532653808594
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] yes 
token:  [S1] on it yeah ok 
70.07947540283203
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] on it yeah ok 
token:  [MOD] What would be th a pl

72.796875
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] So two out of three. We need one 
token:  [S1] ok 
167.9195556640625
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] ok 
token:  [MOD] more. Ah think about different age grou achool. yes I was about to 
700.4086303710938
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] more. Ah think about different age grou achool. yes I was about to 
token:  [S1] Sorry? 
74.30731201171875
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Sorry? 
token:  [MOD] tell 
211.4720001220703
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probabl

220.67433166503906
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] the name of the in in instrument 
token:  [MOD] yes 
159.86334228515625
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] yes 
token:  [S2] ok 
42.407859802246094
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] ok 
token:  [MOD] yeah 
90.82000732421875
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] yeah 
token:  [S1] Symphony? 
154.03060913085938
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Symphony? 
token:  [S2] Violin? 
8.708806991577148
prompt:  This is a conversation be

200.2630157470703
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] I mean great idea 
token:  [S2] Piano? 
116.02693939208984
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] Piano? 
token:  [S1] ok 
19.624021530151367
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] ok 
token:  [MOD] No. 
78.7618637084961
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] No. 
token:  [S2] No. 
25.61289405822754
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] No. 
token:  [MOD] It's yeah 
286.049560546875
prompt:  This is a conversation between users in parethesis

29.92896842956543
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] Violin? you think the first 
token:  [MOD] 
183.23634338378906
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] 
token:  [S1] eh and then the drums maybe? 
279.6881103515625
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] eh and then the drums maybe? 
token:  [S2] May be yes. 
17.696786880493164
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] May be yes. 
token:  [S1] to give the rhythm? and then the 
109.62776184082031
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] to give the 

20.012420654296875
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Makes sense. 
token:  [S2] hmm 
19.643739700317383
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] hmm 
token:  [S1] and paper 
60.04542541503906
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] and paper 
token:  [MOD] Paper! You have the 
114.20359802246094
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] Paper! You have the 
token:  [S2] paper? 
48.903839111328125
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] paper? 
token:  [MOD] second one. 
136.3604736328125
prompt:  This

77.4137954711914
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Meat makes sense. Makes sense. 
token:  [S2] 
7.765684127807617
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] 
token:  [S1] No? No? 
15.625138282775879
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] No? No? 
token:  [MOD] Ah you you have to tell me the the whole 
173.27584838867188
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] Ah you you have to tell me the the whole 
token:  [S1] oh the whole the whole order 
55.714256286621094
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1

7.952502250671387
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] ok 
token:  [MOD] Ready to start? 
40.74002456665039
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] Ready to start? 
token:  [S1] mhmm 
36.388057708740234
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] mhmm 
token:  [MOD] Yeah? So the first question name a public place where you're likely to catch a cold or a flu bug. 
73.0657958984375
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] Yeah? So the first question name a public place where you're likely to catch a cold or a flu bug. 
token:  [S2] w w who who was asked this like what's the public where was it? 
107.411

83.19524383544922
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] ok not really ok 
token:  [MOD] no 
83.3913803100586
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] no 
token:  [S2] 
33.213539123535156
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] 
token:  [MOD] Think about children. 
110.50988006591797
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] Think about children. 
token:  [S1] hmm yeah schools 
202.63534545898438
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] hmm yeah schools 
token:  [MOD] So where school 
228.89183044433594
pr

85.52548217773438
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] their children than a 
token:  [S1] yeah yeah 
20.436214447021484
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] yeah yeah 
token:  [S2] yeah 
7.338903903961182
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] yeah 
token:  [S1] whereas schools it's just it's they're not really 
77.38407897949219
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] whereas schools it's just it's they're not really 
token:  [S2] yeah 
12.167896270751953
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] y

19.655200958251953
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] the drums 
token:  [S1] drums 
12.26707649230957
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] drums 
token:  [MOD] a drum 
49.39092254638672
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] a drum 
token:  [S1] yeah 
56.76496887207031
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] yeah 
token:  [MOD] actually drum is the third one 
260.5971984863281
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] actually drum is the third one 
token:  [S2] yeah 
67.62097930908203
prompt:  

91.24162292480469
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] ok 
token:  [S1] Themselves? Not really but that 
75.0926513671875
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Themselves? Not really but that 
token:  [S2] Other people? 
11.308932304382324
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] Other people? 
token:  [MOD] that's correct as well. Think about food maybe? 
109.5760269165039
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] that's correct as well. Think about food maybe? 
token:  [S2] ok fruits yeah 
391.3316345214844
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict t

13.937021255493164
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] Yeah 
token:  [S1] even though it didn't come to my mind 
17.51299476623535
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] even though it didn't come to my mind 
token:  [S2] thst's a very good shot I think. 
33.93686294555664
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] thst's a very good shot I think. 
token:  [S1] at all but 
44.20742416381836
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] at all but 
token:  [S2] yeah 
31.5549373626709
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
c

36.641937255859375
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] And I would like you to guess, talk to each other and guess the three most popular answers to these questions. And then I will ask you to decide on the ranking. Ok do you in terms of popularity. 
token:  [S2] Ok. 
19.458816528320312
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] Ok. 
token:  [MOD] So for example like if I ask you name what are the main ways in which you can transfer patients in hospital. You would say something like you know a wheelchair, an ambulance, a patient's bed and then I will ask you to talk to each other and decide upon a ranking. O 
41.115989685058594
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] So for example like if I as

74.46831512451172
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] in Ireland but 
token:  [S1] America and in sort of the Middle East 
39.20700454711914
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] America and in sort of the Middle East 
token:  [S2] Yeah yeah. 
11.504698753356934
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] Yeah yeah. 
token:  [S1] but I don't know if 
19.115339279174805
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] but I don't know if 
token:  [S2] Yeah. 
13.915897369384766
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [

21.54998779296875
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] I'd say Go on . 
token:  [S1] I was only going to say hospital number one purely because it's like highest concentration of 
67.76222229003906
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] I was only going to say hospital number one purely because it's like highest concentration of 
token:  [S2] Of really sick people 
51.99968719482422
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] Of really sick people 
token:  [S1] Yeah. 
11.451578140258789
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Yeah. 
token:  [S2] maybe yeah yeah. 
28.679731369018555
prompt:  This is a 

75.2241439819336
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] the third one. 
token:  [S2] Done well. 
84.26263427734375
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] Done well. 
token:  [MOD] Alright? Very good. Are you ready for the second question? 
24.13138198852539
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] Alright? Very good. Are you ready for the second question? 
token:  [S2] mhmm 
34.60340881347656
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] mhmm 
token:  [S1] Sure. 
25.151094436645508
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
c

12.792369842529297
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Yeah. 
token:  [MOD] Is 
174.774658203125
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] Is 
token:  [S2] Yeah. 
135.5219268798828
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] Yeah. 
token:  [MOD] that your final yeah? 
334.037109375
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] that your final yeah? 
token:  [S2] mhmm 
43.54074478149414
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] mhmm 
token:  [MOD] Well done. Yes. 
66.63380432128906
prompt:  This is a conversation 

9.058094024658203
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] That's what I was thinking. 
token:  [S2] Cut 
81.6461181640625
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] Cut 
token:  [S1] Hair. 
7.019855499267578
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Hair. 
token:  [S2] hmm 
25.270599365234375
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] hmm 
token:  [MOD] Excellent. 
105.17472076416016
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] Excellent. 
token:  [S2] Hair. 
105.3193588256836
prompt:  This is a conversation between 

51.392539978027344
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] Hair first wow. 
token:  [S1] Hair okay yeah. 
23.68105125427246
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Hair okay yeah. 
token:  [MOD] Paper number two. and meat 
487.3353271484375
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] Paper number two. and meat 
token:  [S2] ok. 
76.29716491699219
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] ok. 
token:  [S1] Awh that's right ok. 
33.2845573425293
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Awh that's right ok. 
token

103.24102783203125
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] Yes. 
token:  [S2] ok Ok. 
49.26698684692383
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] ok Ok. 
token:  [S1] A doct 
153.27325439453125
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] A doct 
token:  [S2] So 
18.493436813354492
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] So 
token:  [S1] or's waiting room is that public? 
88.025146484375
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] or's waiting room is that public? 
token:  [S2] I guess it is yeah so that makes sens

53.333740234375
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Awh yeah Sorry I I just touched a bus on the way here and it was so slimy it was gross yeah 
token:  [S2] Gross 
28.773639678955078
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] Gross 
token:  [S1] So a bus would be a good one. 
23.1760196685791
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] So a bus would be a good one. 
token:  [S2] Yeah. 
5.92560338973999
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] Yeah. 
token:  [S1] Alright. 
6.487790584564209
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utte

31.558879852294922
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] I don't 
token:  [MOD] the one thing that Irish people love to do How 
123.52256774902344
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] the one thing that Irish people love to do How 
token:  [S1] Complain? 
107.8968505859375
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Complain? 
token:  [MOD] do they travel 
358.1083068847656
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] do they travel 
token:  [S1] Oh sorry that was under there 
138.36807250976562
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probab

41.041847229003906
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] You did tell us the order there though didn't you? 
token:  [MOD] I will give you the order at the e nd If 
75.67276763916016
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] I will give you the order at the e nd If 
token:  [S1] Yeah 
138.93115234375
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Yeah 
token:  [MOD] you can make your final decision then I can give you mine feedback yeah. 
104.8311996459961
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] you can make your final decision then I can give you mine feedback yeah. 
token:  [S2] Ok. 
25.870615005493164
p

74.07333374023438
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] Great. So I would like you to think about instruments what are the most popular answers to name the question of naming an instrument in an in a symphony orchestra. 
token:  [S1] Oh ah just name? 
103.71318054199219
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Oh ah just name? 
token:  [S2] Just an orchestra. 
14.30970573425293
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] Just an orchestra. 
token:  [MOD] In a symphony orchestra or what are the instruments 
70.5851821899414
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] In a symphony orchestra or what are the 

24.215578079223633
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] I don't know I think that was or I don't know the kinda default thing that you think of with the symphony orchestra is like duh duh duh duh duh you know that starts with like the start of universal 
token:  [S1] Yeah 
13.978425025939941
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] Yeah 
token:  [S2] movies you know the dun dun dun dun dun. 
34.700496673583984
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] movies you know the dun dun dun dun dun. 
token:  [S1] oh so the drums? 
36.42822265625
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] oh so the drums? 
token:

76.68451690673828
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] Wrapping paper or 
token:  [MOD] Excellent. 
200.3609161376953
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] Excellent. 
token:  [S2] something 
164.71206665039062
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] something 
token:  [MOD] That's the second one. 
41.257598876953125
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] That's the second one. 
token:  [S2] calorie 
435.4995422363281
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] calorie 
token:  [S1] s nowadays no? car

6.501104354858398
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] hair 
token:  [S1] yes hair 
14.409503936767578
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] yes hair 
token:  [S2] yeah 
12.728894233703613
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] yeah 
token:  [MOD] and meat. 
270.4305114746094
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [MOD] and meat. 
token:  [S1] and meat. Ok. 
17.904130935668945
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] and meat. Ok. 
token:  [S2] Oh yeah I'd been thinking hair and then you said hair Ok. 
5

112.09412384033203
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] stick with that then 
token:  [S2] se at best but yeah 
110.06318664550781
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] se at best but yeah 
token:  [S1] hmm 
11.49522876739502
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] hmm 
token:  [S2] I think hair meat paper 
93.8115005493164
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S2] I think hair meat paper 
token:  [S1] ok 
24.423702239990234
prompt:  This is a conversation between users in parethesis ([S1], [S2], [MOD])
 Predict the next most probable utterance:
context:  [S1] ok 
token:  [MOD] Ok 
52.4974899291992

In [406]:
dominance_scores

{'speech transcription_Transcriber/S05.trs': {'MOD': 150.78121198491849,
  'S1': 75.41003963723779,
  'S2': 71.14946473163107},
 'speech transcription_Transcriber/S17.trs': {'MOD': 158.64770763397217,
  'S1': 71.5698383857464,
  'S2': 69.63107684275487},
 'speech transcription_Transcriber/S10.trs': {'MOD': 140.7730285805392,
  'S1': 82.46366771226077,
  'S2': 112.94518043055679},
 'speech transcription_Transcriber/S21.trs': {'MOD': 155.60970138641724,
  'S1': 74.32951695578438,
  'S2': 74.87702072806981},
 'speech transcription_Transcriber/S18.trs': {'MOD': 211.46182588599194,
  'S1': 68.83044043935911,
  'S2': 128.40242790108297},
 'speech transcription_Transcriber/S14.trs': {'MOD': 167.36222941438916,
  'S1': 70.10998123342341,
  'S2': 92.11443028883501},
 'speech transcription_Transcriber/S19.trs': {'MOD': 179.93626904728436,
  'S1': 62.52755670458357,
  'S2': 92.15837649988934},
 'speech transcription_Transcriber/S22.trs': {'MOD': 192.7635320410671,
  'S1': 71.92604222923818,
  'S2

In [407]:
dominance_df = pd.DataFrame(dominance_scores)
new_columns = pd.DataFrame(dominance_scores).keys().map(lambda x: x.split("/")[-1].replace(".trs",""))
dominance_df.rename(columns=dict(zip(dominance_df.columns, new_columns)), inplace=True)

dominance_df.T

Unnamed: 0,MOD,S1,S2
S05,150.781212,75.41004,71.149465
S17,158.647708,71.569838,69.631077
S10,140.773029,82.463668,112.94518
S21,155.609701,74.329517,74.877021
S18,211.461826,68.83044,128.402428
S14,167.362229,70.109981,92.11443
S19,179.936269,62.527557,92.158376
S22,192.763532,71.926042,85.648863
S11,155.410773,90.692107,60.581103
S20,155.396625,123.057881,103.503758


In [408]:
new_ = dominance_df.T
new_ = new_.reset_index()
new_.rename(columns={'index': 'file_name'}, inplace=True)
new_

Unnamed: 0,file_name,MOD,S1,S2
0,S05,150.781212,75.41004,71.149465
1,S17,158.647708,71.569838,69.631077
2,S10,140.773029,82.463668,112.94518
3,S21,155.609701,74.329517,74.877021
4,S18,211.461826,68.83044,128.402428
5,S14,167.362229,70.109981,92.11443
6,S19,179.936269,62.527557,92.158376
7,S22,192.763532,71.926042,85.648863
8,S11,155.410773,90.692107,60.581103
9,S20,155.396625,123.057881,103.503758


In [409]:
real_labels = []
for el, name in zip(pd.read_csv("../data/processed/transcript_dominance.csv")["file_content"],pd.read_csv("../data/processed/transcript_dominance.csv")["file_name"]):
    pattern = r'\[(P\d|MOD)\]'
    matches = re.findall(pattern, el)
    real_labels.append([name, matches[0]])

real_labels_df = pd.DataFrame(real_labels, columns=["path","first_occ_speaker"])
real_labels_df

Unnamed: 0,path,first_occ_speaker
0,S02,P1
1,S03,P1
2,S04,P1
3,S05,P2
4,S07,P2
5,S08,P2
6,S09,P2
7,S10,P1
8,S11,P1
9,S13,P1


In [410]:
pattern = r'\[(S\d)\]'

multisimo_df["path"] = multisimo_df["path"].map(lambda x: x.split("/")[-1].replace(".trs",""))
multisimo_df["first_occ_speaker"] = multisimo_df["text"].map(lambda x: re.findall(pattern, x)[0])
multisimo_df

Unnamed: 0,path,text,first_occ_speaker
0,S05,"[MOD] Ok hi welcome, thank you for coming toda...",S2
1,S17,"[MOD] Hello guys, thanks very much for being h...",S1
2,S10,[MOD] Ok. So I would like us to play a quiz. O...,S1
3,S21,[MOD] Ok so hello guys. Thanks very [S1] Hi. [...,S1
4,S18,[MOD] Ok hi guys Thanks very much for coming [...,S1
5,S14,[MOD] Hello guys thanks very much for coming h...,S2
6,S19,[MOD] Perfect. Well hi guys. Welcome. [S1] Hi....,S1
7,S22,[MOD] Ah it's fine. Hello guys. Thanks very mu...,S1
8,S11,"[MOD] Right. So, I would like us to play a qui...",S1
9,S20,[MOD] So hello. Thanks very [S1] Hi. [MOD] muc...,S1


In [411]:
pd.merge(real_labels_df,multisimo_df, on="path")[["path","first_occ_speaker_y","first_occ_speaker_x"]]

Unnamed: 0,path,first_occ_speaker_y,first_occ_speaker_x
0,S02,S1,P1
1,S04,S1,P1
2,S05,S2,P2
3,S07,S2,P2
4,S08,S2,P2
5,S09,S2,P2
6,S10,S1,P1
7,S11,S1,P1
8,S13,S1,P1
9,S14,S2,P2


In [427]:
final_df = pd.read_csv("../data/processed/transcript_dominance.csv").iloc[:,:13].merge(new_)
final_df

Unnamed: 0,file_name,speaker_1_1,speaker_1_2,speaker_1_3,speaker_1_4,speaker_1_5,speaker_2_1,speaker_2_2,speaker_2_3,speaker_2_4,speaker_2_5,speaker_1_dom_score,speaker_2_dom_score,MOD,S1,S2
0,S02,3.0,2.0,2.0,2.0,1.0,4.0,3.0,3.0,4.0,3.0,2.0,3.4,209.768309,72.504405,89.041085
1,S04,2.0,1.0,2.0,4.0,1.0,1.0,1.0,1.0,4.0,1.0,2.0,1.6,162.487589,70.363963,84.603189
2,S05,4.0,4.0,4.0,4.0,3.0,3.0,2.0,3.0,1.0,1.0,3.8,2.0,150.781212,75.41004,71.149465
3,S07,4.0,2.0,3.0,4.0,4.0,4.0,2.0,3.0,5.0,3.0,3.4,3.4,250.00224,85.450625,76.788336
4,S08,4.0,2.0,3.0,2.0,1.0,3.0,3.0,3.0,3.0,2.0,2.4,2.8,238.73516,79.984618,79.034911
5,S09,4.0,3.0,3.0,5.0,3.0,4.0,3.0,3.0,5.0,3.0,3.6,3.6,106.555361,115.6402,108.628731
6,S10,3.0,2.0,3.0,4.0,2.0,3.0,2.0,2.0,4.0,2.0,2.8,2.6,140.773029,82.463668,112.94518
7,S11,5.0,2.0,3.0,3.0,5.0,2.0,1.0,2.0,1.0,1.0,3.6,1.4,155.410773,90.692107,60.581103
8,S13,3.0,1.0,2.0,4.0,2.0,2.0,1.0,2.0,1.0,1.0,2.4,1.4,122.683918,131.231964,170.765801
9,S14,4.0,3.0,3.0,4.0,3.0,3.0,4.0,4.0,4.0,3.0,3.4,3.6,167.362229,70.109981,92.11443


In [413]:
import os
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import scipy.stats
import plotly
import plotly.io as pio
pio.renderers.default = 'iframe'
import plotly.express as px
plotly.offline.init_notebook_mode(connected=True)
import seaborn as sns

In [414]:
cmp = 'algae'
def correlation_heatmap(y_cols, x_cols, full_data):
    '''
    Uses scipy.stats.spearmanr function
    Params:
    y_cols, x_cols: sets of column titles (strings)
    full_data: pandas dataframe that includes all columns listed in y_cols, x_cols
    Returns:
    corr: Spearman correlation coefficient matrix (y_cols = rows, x_cols = cols of matrix)
    fig_corr: annotated plotly heatmap of coefficients
    p: Spearman p-value matrix
    fig_p: annotated plotly heatmap of p-values
    '''
    cols = y_cols+x_cols
    all_correlations = scipy.stats.spearmanr(full_data[cols], nan_policy='omit')
    corr = all_correlations.statistic[:len(y_cols), -len(x_cols):]
    corr = pd.DataFrame(corr)
    corr.columns = x_cols
    corr.index = y_cols

    p = all_correlations.pvalue[:len(y_cols), -len(x_cols):]
    p = pd.DataFrame(p)
    p.columns = x_cols
    p.index = y_cols
    
    fig_corr = px.imshow(corr, text_auto=True, aspect='auto', color_continuous_scale='agsunset')
    fig_r2 = px.imshow(corr**2, text_auto=True, aspect='auto', color_continuous_scale='agsunset')
    fig_p = px.imshow(p, text_auto=True, aspect='auto', color_continuous_scale='gray_r')

    return corr, fig_corr, p, fig_p, fig_r2

In [415]:
def correlation(df_final):
        corr, fig_corr, p, fig_p, fig_r2 = correlation_heatmap(col_1, col_2, df_final)
        fig_corr.show()
        fig_p.show()
        fig_r2.show()
        return corr, fig_corr, p, fig_p, fig_r2

In [416]:
y_s = final_df.iloc[:,-2:]
X = final_df.iloc[:,-5:-3]
col_1 = list(X.keys())
col_2 = list(y_s.keys())
corr, fig_corr, p, fig_p, fig_r2 = correlation(final_df)

In [435]:
final_df.iloc[:,-3]

0      89.041085
1      84.603189
2      71.149465
3      76.788336
4      79.034911
5     108.628731
6     112.945180
7      60.581103
8     170.765801
9      92.114430
10     69.631077
11    128.402428
12     92.158376
13    103.503758
14     74.877021
15     85.648863
16     75.678047
Name: S2, dtype: float64

In [442]:
final_df["speaker_1_dom_score"]>final_df["speaker_2_dom_score"]

0     False
1      True
2      True
3     False
4     False
5     False
6      True
7      True
8      True
9     False
10     True
11     True
12    False
13     True
14    False
15    False
16     True
dtype: bool

In [450]:
final_df['s1_gt_s2'] = final_df["speaker_1_dom_score"] > final_df["speaker_2_dom_score"]
final_df['s1gt_gt_s2gt'] = final_df["S1"].astype(int) > final_df["S2"].astype(int)
final_df

Unnamed: 0,file_name,speaker_1_1,speaker_1_2,speaker_1_3,speaker_1_4,speaker_1_5,speaker_2_1,speaker_2_2,speaker_2_3,speaker_2_4,speaker_2_5,speaker_1_dom_score,speaker_2_dom_score,MOD,S1,S2,s1_gt_s2,s1gt_gt_s2gt
0,S02,3.0,2.0,2.0,2.0,1.0,4.0,3.0,3.0,4.0,3.0,2.0,3.4,209.768309,72.504405,89.041085,False,False
1,S04,2.0,1.0,2.0,4.0,1.0,1.0,1.0,1.0,4.0,1.0,2.0,1.6,162.487589,70.363963,84.603189,True,False
2,S05,4.0,4.0,4.0,4.0,3.0,3.0,2.0,3.0,1.0,1.0,3.8,2.0,150.781212,75.41004,71.149465,True,True
3,S07,4.0,2.0,3.0,4.0,4.0,4.0,2.0,3.0,5.0,3.0,3.4,3.4,250.00224,85.450625,76.788336,False,True
4,S08,4.0,2.0,3.0,2.0,1.0,3.0,3.0,3.0,3.0,2.0,2.4,2.8,238.73516,79.984618,79.034911,False,False
5,S09,4.0,3.0,3.0,5.0,3.0,4.0,3.0,3.0,5.0,3.0,3.6,3.6,106.555361,115.6402,108.628731,False,True
6,S10,3.0,2.0,3.0,4.0,2.0,3.0,2.0,2.0,4.0,2.0,2.8,2.6,140.773029,82.463668,112.94518,True,False
7,S11,5.0,2.0,3.0,3.0,5.0,2.0,1.0,2.0,1.0,1.0,3.6,1.4,155.410773,90.692107,60.581103,True,True
8,S13,3.0,1.0,2.0,4.0,2.0,2.0,1.0,2.0,1.0,1.0,2.4,1.4,122.683918,131.231964,170.765801,True,False
9,S14,4.0,3.0,3.0,4.0,3.0,3.0,4.0,4.0,4.0,3.0,3.4,3.6,167.362229,70.109981,92.11443,False,False


In [449]:
sum(final_df["s1_gt_s2"] == final_df["s1gt_gt_s2gt"])/len(final_df["s1_gt_s2"])

0.5882352941176471

In [446]:
final_df

Unnamed: 0,file_name,speaker_1_1,speaker_1_2,speaker_1_3,speaker_1_4,speaker_1_5,speaker_2_1,speaker_2_2,speaker_2_3,speaker_2_4,speaker_2_5,speaker_1_dom_score,speaker_2_dom_score,MOD,S1,S2,s1_gt_s2,s1gt_gt_s2gt
0,S02,3.0,2.0,2.0,2.0,1.0,4.0,3.0,3.0,4.0,3.0,2.0,3.4,209.768309,72.504405,89.041085,False,False
1,S04,2.0,1.0,2.0,4.0,1.0,1.0,1.0,1.0,4.0,1.0,2.0,1.6,162.487589,70.363963,84.603189,True,False
2,S05,4.0,4.0,4.0,4.0,3.0,3.0,2.0,3.0,1.0,1.0,3.8,2.0,150.781212,75.41004,71.149465,True,True
3,S07,4.0,2.0,3.0,4.0,4.0,4.0,2.0,3.0,5.0,3.0,3.4,3.4,250.00224,85.450625,76.788336,False,True
4,S08,4.0,2.0,3.0,2.0,1.0,3.0,3.0,3.0,3.0,2.0,2.4,2.8,238.73516,79.984618,79.034911,False,True
5,S09,4.0,3.0,3.0,5.0,3.0,4.0,3.0,3.0,5.0,3.0,3.6,3.6,106.555361,115.6402,108.628731,False,True
6,S10,3.0,2.0,3.0,4.0,2.0,3.0,2.0,2.0,4.0,2.0,2.8,2.6,140.773029,82.463668,112.94518,True,False
7,S11,5.0,2.0,3.0,3.0,5.0,2.0,1.0,2.0,1.0,1.0,3.6,1.4,155.410773,90.692107,60.581103,True,True
8,S13,3.0,1.0,2.0,4.0,2.0,2.0,1.0,2.0,1.0,1.0,2.4,1.4,122.683918,131.231964,170.765801,True,False
9,S14,4.0,3.0,3.0,4.0,3.0,3.0,4.0,4.0,4.0,3.0,3.4,3.6,167.362229,70.109981,92.11443,False,False
