In [2]:
#@Imports
import sys
import os
path = os.path.abspath('..')
if path not in sys.path:
  sys.path.insert(0, path)

%load_ext autoreload

import numpy as np
import matplotlib.pyplot as plt

from IPython.display import clear_output
from retry import retry

from language_models.ollama_logits import OllamaLanguageModel
#from language_models.ollama_model import OllamaLanguageModel

from components.components import compute_desire_for_gamble, multiple_choice_preferences, compute_distribution_of_desire_for_gamble, compute_distribution_of_desire_for_gamble_binaries

  from .autonotebook import tqdm as notebook_tqdm


In [3]:
system_message = ("This is an agent based model. "
  f"The goal of the LLM to to play characters in a game, and act as humanlike as possible. "
  "Ideally, human observers should not be able to tell the difference between the LLM and a human player. "
)

model = OllamaLanguageModel(
"llama3:70b", system_message=system_message, streaming=False
)

In [5]:
def make_prompt(valence, gamble):
    instruction = (
        "Cross-Modality Judgment Instructions:\n"
        f"For this decision, you will map the intensity of that {valence} emotion that you would have towards a gamble if you were to have to take it. In other words, while anticipating the outcome and before you find out whether you win or lose, how much {valence} sensation would you have relative to the strongest imaginable sensation. In real life, this is the type of emotional information that people would use to make a decision about whether to approach or avoid something.\n\n"

        "The possible wins in this task can go as high as 100 dollars, and the possible losses can go as big as 100 dollars."
        
        "1. Understanding the Scale:\n"
        "- The scale ranges from 'No Sensation' (NS) to the 'Strongest Imaginable Sensation of Any Kind.'\n"
        "- Examples of the strongest imaginable sensation include: staring at the sun, hearing a jet plane take off, or other strong sensations that can be objectively measured using technology. Things like light and sound.\n\n"

        "2. Purpose of Cross-Modality Matching:\n"
        "- You will rate the intensity of different gambles indicating where they fall on the scale.\n"
        "- To facilitate consistent responses across various types of sensations, we'll use light intensity as a metaphor.\n\n"

        "3. Mapping Emotions on the Scale:\n"
        f"- Your task is to map the intensity of a specific {valence} emotion, specifically the {valence} anticipation you might have if you were to take a gamble before knowing the outcome.\n"
        f"- Consider only the {valence} feelings related to this anticipation and ignore {'negative' if valence =='positive' else 'positive'} ones for now.\n\n"

        "4. Scale Descriptions:\n"
        # "1) No Sensation (NS): Total darkness, no light at all.\n"
        # "2) Almost no Sensation: Barely noticeable glow, like the night sky on a moonless night.\n"
        # "3) Faint Sensation: Soft glow, dim like distant starlight.\n"
        # "4) Slight Sensation: Noticeable but dim light, like a candle flickering.\n"
        # "5) Mild Sensation: Moderate glow, like a lit lantern in the dark.\n"
        # "6) Moderate Sensation: Reading light, bright enough to see clearly.\n"
        # "7) Strong Sensation: Sunny day, brightly illuminated.\n"
        # "8) Intense Sensation: Floodlights, intense but can be looked at for a short time.\n"
        # "9) Strongest Imaginable Sensation: Blinding flash from the sun, overwhelming brightness.\n"
        "a) No Sensation (NS): Total darkness, no light at all."
        "b) Slight Sensation: Soft glow, dim like distant starlight."
        "c) Moderate Sensation: Reading light, bright enough to see clearly."
        "d) Strong Sensation: Sunny day, brightly illuminated."
        "e) Very Strong Sensation: Floodlights, intense but bearable."
        "f) Strongest Imaginable Sensation: Blinding flash, overwhelming brightness."

        f"The gamble to be considered is: {gamble}.\n\n"

        "Only answer with the number that corresponds to one sensation above, without any explanations."
    )
    return instruction

def make_prompt_no_metaphor(valence, gamble):
    instruction = (
        "Cross-Modality Judgment Instructions:\n"
        f"For this decision, you will map the intensity of that {valence} emotion that you would have towards a gamble if you were to have to take it. In other words, while anticipating the outcome and before you find out whether you win or lose, how much {valence} sensation would you have relative to the strongest imaginable sensation. In real life, this is the type of emotional information that people would use to make a decision about whether to approach or avoid something.\n\n"

        "The possible wins in this task can go as high as 100 dollars, and the possible losses can go as big as 100 dollars."
        
        "1. Understanding the Scale:\n"
        "- The scale ranges from 'No Sensation' (NS) to the 'Strongest Imaginable Sensation of Any Kind.'\n"
        "- Examples of the strongest imaginable sensation include: staring at the sun, hearing a jet plane take off, or other strong sensations that can be objectively measured using technology. Things like light and sound.\n\n"

        "2. Purpose of Cross-Modality Matching:\n"
        "- You will rate the intensity of different gambles indicating where they fall on the scale.\n"
        "- To facilitate consistent responses across various types of sensations, we'll use light intensity as a metaphor.\n\n"

        "3. Mapping Emotions on the Scale:\n"
        f"- Your task is to map the intensity of a specific {valence} emotion, specifically the {valence} anticipation you might have if you were to take a gamble before knowing the outcome.\n"
        f"- Consider only the {valence} feelings related to this anticipation and ignore {'negative' if valence =='positive' else 'positive'} ones for now.\n\n"

        "4. Scale Descriptions:\n"
        "a) No Sensation (NS)\n"
        "b) Slight Sensation\n"
        "c) Moderate Sensation\n"
        "d) Strong Sensation\n"
        "e) Very Strong Sensation\n"
        "f) Strongest Imaginable Sensation\n"

        f"The gamble to be considered is: {gamble}.\n\n"

        "Only answer with the number that corresponds to one sensation above, without any explanations."
    )
    return instruction

def make_gamble(gv, bv, pw):
    instruction = (
        "You are presented with a gamble. It has a probability of winning, a value for winning, and a value for losing. "
        "If you win, you get the win value, if you lose, you get loss value. "
        f"The probability of winning is {pw}%, the value of winning is {gv} dollars, and the value of losing is {bv} dollars."
    )
    return instruction

In [6]:
gv = "+$10"
bv = "-$1000"
pw = 50
# query = ['a', 'b', 'c', 'd', 'e', 'f', 'g', 'h', 'i']
# query = ['1', '2', '3', '4', '5', '6', '7', '8', '9']
# query = ['a', 'b', 'c', 'd', 'e', 'f']
gamble = make_gamble(gv, bv, pw)
prompt = make_prompt("negative", gamble)
output, logits = model.sample_text(prompt, logits=True, query_tokens=query)
print(output)
print(logits)

NameError: name 'query' is not defined

In [7]:
gvs = [10, 30, 50, 70, 90]
bvs = [-10, -30, -50, -70, -90]
P_w = [25, 50, 75]
query = ['a', 'b', 'c', 'd', 'e', 'f']
# query = ['1', '2', '3', '4', '5', '6', '7', '8', '9']
results = {}

for gv in gvs:
  for bv in bvs:
    for pw in P_w:
        # clear_output(wait = True)
        print(f"Evaluating: {gv}, {bv}, {pw}")
        gamble = make_gamble(gv, bv, pw)

        # Positive
        prompt = make_prompt_no_metaphor("positive", gamble)
        output, pos_logits = model.sample_text(prompt, logits=True, query_tokens=query)
        for q in query:
           if q not in pos_logits:
            pos_logits[q] = 0

        # Negative
        prompt = make_prompt_no_metaphor("negative", gamble)
        output, neg_logits = model.sample_text(prompt, logits=True, query_tokens=query)
        for q in query:
           if q not in neg_logits:
            neg_logits[q] = 0
        print(pos_logits, neg_logits)
        assert len(pos_logits) == 6
        assert len(neg_logits) == 6
        results[(gv, bv, pw)] = (pos_logits, neg_logits)

Evaluating: 10, -10, 25
{'a': 1.0690431736293249e-05, 'b': 0.09172152727842331, 'c': 0.8407089114189148, 'd': 0.06756957620382309, 'e': 9.954306005965918e-05, 'f': 1.1933154837606708e-06} {'a': 1.9256303858128376e-06, 'b': 0.002101536374539137, 'c': 0.45087501406669617, 'd': 0.5491250157356262, 'e': 0.00024744481197558343, 'f': 8.699018962943228e-07}
Evaluating: 10, -10, 50
{'a': 3.3743872336344793e-06, 'b': 0.05063623934984207, 'c': 0.9712496995925903, 'd': 0.02875029481947422, 'e': 2.5980338250519708e-05, 'f': 0} {'a': 5.12381211592583e-06, 'b': 0.04139076918363571, 'c': 0.9586092233657837, 'd': 0.03284623473882675, 'e': 1.3249205949250609e-05, 'f': 0}
Evaluating: 10, -10, 75
{'a': 2.1791147446492687e-06, 'b': 0.0022257536184042692, 'c': 0.4201645851135254, 'd': 0.5798354148864746, 'e': 0.0004034293524455279, 'f': 1.145842702499067e-06} {'a': 5.990852150716819e-05, 'b': 0.37926971912384033, 'c': 0.6207302808761597, 'd': 0.01665729284286499, 'e': 2.1195291992626153e-05, 'f': 0}
Evalua

In [8]:
print(results)
parsed_results = {}
for k, v in results.items():
    pos_list = []
    neg_list = []
    for q in query:
        pos_list.append(v[0][q])
        neg_list.append(v[1][q])
    parsed_results[k] = (pos_list, neg_list)
print(parsed_results)

{(10, -10, 25): ({'a': 1.0690431736293249e-05, 'b': 0.09172152727842331, 'c': 0.8407089114189148, 'd': 0.06756957620382309, 'e': 9.954306005965918e-05, 'f': 1.1933154837606708e-06}, {'a': 1.9256303858128376e-06, 'b': 0.002101536374539137, 'c': 0.45087501406669617, 'd': 0.5491250157356262, 'e': 0.00024744481197558343, 'f': 8.699018962943228e-07}), (10, -10, 50): ({'a': 3.3743872336344793e-06, 'b': 0.05063623934984207, 'c': 0.9712496995925903, 'd': 0.02875029481947422, 'e': 2.5980338250519708e-05, 'f': 0}, {'a': 5.12381211592583e-06, 'b': 0.04139076918363571, 'c': 0.9586092233657837, 'd': 0.03284623473882675, 'e': 1.3249205949250609e-05, 'f': 0}), (10, -10, 75): ({'a': 2.1791147446492687e-06, 'b': 0.0022257536184042692, 'c': 0.4201645851135254, 'd': 0.5798354148864746, 'e': 0.0004034293524455279, 'f': 1.145842702499067e-06}, {'a': 5.990852150716819e-05, 'b': 0.37926971912384033, 'c': 0.6207302808761597, 'd': 0.01665729284286499, 'e': 2.1195291992626153e-05, 'f': 0}), (10, -30, 25): ({'a'

In [9]:
import csv

filename = 'sensation_no_metaphor.csv'
with open(filename, mode='w', newline='') as file:
    writer = csv.writer(file)
    writer.writerow(['gv', 'bv', 'pw', 'positive', 'negative'])
    for (gv, bv, pw), (pos_list, neg_list) in parsed_results.items():
        pos_string = '[' + ' '.join(str(x) for x in pos_list) + ']'
        neg_string ='[' + ' '.join(str(x) for x in neg_list) + ']'
        writer.writerow([gv, bv, pw, pos_string, neg_string])