# Dataset, documents, FAISS; retriever

## 🔹 Load the dataset containing the tuples `(query, correct_answer, distractor_1, distractor_2)` and the one containing the documents

In [7]:
from datasets import load_dataset

# load the 'train' split of the dataset holding the (query, correct_answer, distractor_1, distractor_2) tuples
# NOTE(review): trust_remote_code=True presumably allows code shipped with the dataset repo to run — confirm it is needed
dataset = load_dataset('saracandu/msmarco_modified', split="train", trust_remote_code=True)
dataset

Dataset({
    features: ['Unnamed: 0', 'answers', 'passages', 'query', 'query_id', 'query_type', 'wellFormedAnswers', 'correct_answer', 'distractor_1', 'distractor_2'],
    num_rows: 82326
})

In [8]:
from langchain.document_loaders import HuggingFaceDatasetLoader

# load the 'saracandu/msmarco_filtered' dataset as LangChain documents,
# taking each document's page_content from the 'passage_text' column
loader = HuggingFaceDatasetLoader('saracandu/msmarco_filtered', 'passage_text')
documents = loader.load()
documents[0] # just to check



Document(page_content='"Since 2007, the RBA\'s outstanding reputation has been affected by the \'Securency\' or NPA scandal. These RBA subsidiaries were involved in bribing overseas officials so that Australia might win lucrative note-printing contracts. The assets of the bank include the gold and foreign exchange reserves of Australia, which is estimated to have a net worth of A$101 billion. Nearly 94% of the RBA\'s employees work at its headquarters in Sydney, New South Wales and at the Business Resumption Site."')

## 🔹 Turn `documents` into a vector database using FAISS

In [None]:
from langchain.text_splitter import RecursiveCharacterTextSplitter
from langchain.embeddings import HuggingFaceEmbeddings
from langchain.vectorstores import FAISS

# create an instance of the RecursiveCharacterTextSplitter class with specific parameters
# (it splits text into chunks of up to 500 characters each, with a 20-character overlap)
text_splitter = RecursiveCharacterTextSplitter(chunk_size=500, chunk_overlap=20)

# 'documents' holds the loaded passages; split them into smaller Document chunks with the text splitter
docs = text_splitter.split_documents(documents)

In [None]:
# choose an embedding method:
# sentence-transformers model used to embed the chunks when the FAISS index is built
embeddings = HuggingFaceEmbeddings(
    model_name="sentence-transformers/multi-qa-mpnet-base-dot-v1",  
)

In [None]:
# embed the documents 'docs' into vectors using the embedding method specified by 'embeddings'
# the result is stored in a FAISS index:
db = FAISS.from_documents(docs, embeddings)

# to avoid computing it each time (since the docs won't change), save the result in the storage
# NOTE(review): this writes index_name "MSMARCO_FaissIndex_MPNet", whereas the loading cell reads
# "MSMARCO_FaissIndex_MiniLM" with a MiniLM embedding model, so the index saved here is not the one loaded there
db.save_local(folder_path="faiss_db", index_name="MSMARCO_FaissIndex_MPNet")

## 🔹 Load the already existing vector database (if it exists)

In [9]:
from langchain.embeddings import HuggingFaceEmbeddings
from langchain.vectorstores import FAISS

# embedding model paired with the stored index
# NOTE(review): presumably this must be the same model the "MSMARCO_FaissIndex_MiniLM" index was built with — confirm
embeddings = HuggingFaceEmbeddings(
    model_name="sentence-transformers/multi-qa-MiniLM-L6-dot-v1",  
)

db = FAISS.load_local(
    folder_path="faiss_db", # where to find it
    embeddings=embeddings, # in which "embedding language" it is expressed
    index_name="MSMARCO_FaissIndex_MiniLM", # since the folder contains multiple vector databases, specify its name
    # NOTE(review): this flag opts in to pickle-based deserialization; only load index files you created or trust
    allow_dangerous_deserialization=True
)

You try to use a model that was created with version 3.0.0.dev0, however, your version is 2.6.1. This might cause unexpected behavior or errors. In that case, try to update to the latest version.





## 🔹 Use it as a `retriever`

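**Note:** the value of `'k'` in `search_kwargs` specifies the number of documents to retrieve each time `retriever` is invoked (the discussion below refers to `'k'=10`; the cell below currently sets `'k': 1`). 
The default type of search performed is `similarity`.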

In [10]:
# expose the vector store as a retriever; 'k' is the number of documents returned per query
# NOTE(review): 'k' is 1 here, while the surrounding notes discuss 'k'=10 — confirm the intended value
retriever = db.as_retriever(
    search_kwargs={'k': 1,}
) 

Why `'k'=10`? Because MSMARCO assigns 10 text passages to each `(query, answer)` pair, and only 1 or 2 of these are truly relevant. 
In this first step of the analysis I chose not to create `len(dataset)` different vector databases, one for each `(query, answer)` pair, but instead to merge all the passages together and store them in a single vector database. 


**WITH `'k'=10` SOME ANSWERS COME OUT WRONG! IF YOU LOWER IT TO `3` OR `4` THEY DON'T :)**

# Model part (`Llama-2-7b-chat-hf`)

## ▪️ Load the model:

In [None]:
# do not run this unless necessary!

from huggingface_hub import login
login()

In [1]:
import torch
from transformers import (
    AutoModelForCausalLM,
    AutoTokenizer,
    BitsAndBytesConfig,
    HfArgumentParser,
    pipeline,
    logging,
)
from peft import LoraConfig, PeftModel

#################################################################
# Tokenizer
#################################################################

# Hugging Face Hub id shared by the tokenizer and the model loaded below
model_name="meta-llama/Llama-2-7b-chat-hf"

tokenizer = AutoTokenizer.from_pretrained(model_name, trust_remote_code=True)
# pad with the end-of-sequence token, on the right-hand side of the sequence
tokenizer.pad_token = tokenizer.eos_token
tokenizer.padding_side = "right"

#################################################################
# bitsandbytes parameters
#################################################################

# Activate 4-bit precision base model loading
use_4bit = True

# Compute dtype for 4-bit base models
bnb_4bit_compute_dtype = "float16"

# Quantization type (fp4 or nf4)
bnb_4bit_quant_type = "nf4"

# Activate nested quantization for 4-bit base models (double quantization)
use_nested_quant = False

#################################################################
# Set up quantization config
#################################################################
# resolve the dtype name above (a string) to the matching torch attribute, e.g. torch.float16
compute_dtype = getattr(torch, bnb_4bit_compute_dtype)

bnb_config = BitsAndBytesConfig(
    load_in_4bit=use_4bit,
    bnb_4bit_quant_type=bnb_4bit_quant_type,
    bnb_4bit_compute_dtype=compute_dtype,
    bnb_4bit_use_double_quant=use_nested_quant,
)

# Check GPU compatibility with bfloat16
# (informational only: this block just prints a hint and does not change compute_dtype)
# NOTE(review): torch.cuda.get_device_capability() presumably requires an available CUDA device — confirm
if compute_dtype == torch.float16 and use_4bit:
    major, _ = torch.cuda.get_device_capability()
    if major >= 8:
        print("=" * 80)
        print("Your GPU supports bfloat16: accelerate training with bf16=True")
        print("=" * 80)

#################################################################
# Load pre-trained config
#################################################################
# load the causal LM with the quantization settings defined above
model = AutoModelForCausalLM.from_pretrained(
    model_name,
    quantization_config=bnb_config,
)

`low_cpu_mem_usage` was None, now set to True since model is quantized.


Loading checkpoint shards:   0%|          | 0/2 [00:00<?, ?it/s]

In [3]:
from outlines import models

new_model = models.Transformers(model, tokenizer)

In [5]:
import outlines

# quick sanity check of constrained generation with outlines:
# the generator is built from a fixed list of two labels, "Positive" and "Negative"
prompt = """You are a sentiment-labelling assistant.
Is the following review positive or negative?

Review: This restaurant is just awesome!
"""

generator = outlines.generate.choice(new_model, ["Positive", "Negative"])
answer = generator(prompt)

Compiling FSM index for all state transitions: 100%|█████████████████████████████████████████████████████████████████████████████████████████████████████████| 12/12 [00:02<00:00,  5.77it/s]


In [6]:
print(answer)

Positive


## 🔹 Pipeline for **thesis** generation

In [6]:
from langchain.llms import HuggingFacePipeline

# Text-generation pipeline used to produce the thesis (the model's first answer).
# Decoding is greedy (do_sample=False), so the sampling-only settings `temperature`
# and `top_p` are not passed: they have no effect without sampling and only
# trigger generation-config warnings.
response_generation_pipeline = pipeline(
    model=model,
    tokenizer=tokenizer,
    task="text-generation", # must match the task on the model's HF card, otherwise an error is raised
    do_sample=False,
    repetition_penalty=1.5,
    # keep the prompt in the returned text
    # NOTE(review): `extract_answer` searches the output for the prompt's closing marker —
    # confirm the LangChain wrapper does not strip the prompt
    return_full_text=True,
    max_new_tokens=400,
)

# LangChain wrapper so the pipeline can be used as the last step of a chain
response_generation_llm = HuggingFacePipeline(pipeline=response_generation_pipeline)

## ▪️ Select a subset of the true dataset as a test

In [7]:
# select a subset of the queries, just for test:
# (the first 50 rows; the same [:50] slice is applied to the answers and distractors)
first_queries = dataset['query'][:50]
first_queries

['what is rba',
 'was ronald reagan a democrat',
 'how long do you need for sydney and surrounding areas',
 'price to install tile in shower',
 'why conversion observed in body',
 'where are the lungs located in the back',
 'cost to get a patent',
 'what does a metabolic acidosis need to reverse the condition',
 'best tragedies of ancient greece',
 'what is a conifer',
 'in animals somatic cells are produced by and gametic cells are produced by',
 'remembering the name of the author who wrote the cat in the hat',
 'how long cooking chicken legs in the big easy',
 'average cost of heating per square foot',
 'is mount pinatubo made of granite or basalt',
 'concrete pads cost',
 'what kind of organism is a black damsel',
 'who coined the phrase it is what it is',
 'what is oilskin fabric',
 'how long is german measles contagious',
 'what is a camerata',
 'how long does it take to bake a pound cake',
 'what is the maximum dose of subutex',
 'salary difference in same team',
 'what was tet'

In [8]:
# same for correct answers and distractors:
# (first 50 rows of each column, taken with the same [:50] slice as the queries so the lists can be indexed together)
correct_answers = dataset['correct_answer'][:50]
distractors_1 = dataset['distractor_1'][:50]
distractors_2 = dataset['distractor_2'][:50]

## ▪️ Merge the true answer and the distractors into a vector, shuffling the order of the elements

In [9]:
# shuffles the order of the vector containing the correct answer and the two distractors
# returns another vector, shuffled
import random

def shuffleAnswers(correct_answer, distractor_1, distractor_2):
    """
    Put the correct answer and the two distractors in a new list, in random order.

    The order is drawn from the module-level `random` generator, so it changes
    between calls unless the generator is seeded.

    Returns:
        A list with the three given values, shuffled.
    """
    candidates = [correct_answer]
    candidates.extend((distractor_1, distractor_2))
    random.shuffle(candidates)
    return candidates

## ▪️ Function to properly format the retrieved documents

In [10]:
# auxiliary function to format properly the output of the retrieval step

def format_page_content(documents):
    """
    Render the retrieved documents as a numbered block of plain text.

    Only each document's `page_content` is kept (with leading/trailing spaces
    removed); every entry becomes one line of the form "[i]: <content>",
    numbered from 1 and terminated by a newline.

    Returns:
        The concatenated lines as a single string ("" for no documents).
    """
    numbered_lines = []
    for position, document in enumerate(documents, start=1):
        body = document.page_content.strip(" ")
        numbered_lines.append(f"[{position}]: {body}\n")
    return "".join(numbered_lines)

## 🔹 PromptTemplate definition and a LLMChain for the **thesis** 

In [11]:
# prompt template definition (thesis step)
# requires question, option_a, option_b, option_c (the three candidate answers) and context as input variables!
# the template ends with "The correct answer is:", the marker that extract_answer looks for in the output

from langchain import PromptTemplate
prompt_template = PromptTemplate.from_template(
"""
    You're a helpful assistant and you are asked to answer a question correctly, given a certain number of options. 
    Answer with the correct option only and then stop.
    Given this question: {question} \n
    You must answer by choosing only one option above these: {option_a}, {option_b}, {option_c}. \n
    Here is context to help: {context} \n
    The correct answer is:
 """
)

In [12]:
# LLM chain definition
from operator import itemgetter

# Each prompt placeholder is filled from the same-named key of the dict given to `invoke`.
augmentation = {
    field: itemgetter(field)
    for field in ("question", "option_a", "option_b", "option_c", "context")
}

# input dict -> filled prompt -> LLM
thesis_chain = augmentation | prompt_template | response_generation_llm

In [None]:
prompt_template

In [None]:
response_generation_llm

In [None]:
thesis_chain

## 🔹 Function that generates the output given the prompt, the question and the set of options

In [13]:
def thesisGeneration(query, prompt_template, merged):
    """
    Retrieve context for `query` and ask the thesis chain to pick one of the options.

    Args:
        query: the question; used both for retrieval and to fill the prompt.
        prompt_template: accepted but not read here; the module-level
            `thesis_chain` is invoked as it is.
        merged: sequence whose first three items fill option_a, option_b, option_c.

    Returns:
        Whatever `thesis_chain.invoke` returns for the assembled inputs.
    """
    context_block = format_page_content(retriever.invoke(query))

    chain_inputs = {
        'question': query,
        'option_a': merged[0],
        'option_b': merged[1],
        'option_c': merged[2],
        'context': context_block,
    }
    return thesis_chain.invoke(chain_inputs)

In [14]:
# extract the true answer (i.e. remove the unnecessary)

def extract_answer(text):
    """
    Return the model's answer: the text that follows the first
    "The correct answer is:" marker, with surrounding whitespace removed.

    If the marker does not occur in `text` (for instance because the prompt
    was not echoed back in the generation), the whole text is returned,
    stripped. Previously a missing marker made `find` return -1, so the slice
    started at index 21 and silently dropped the beginning of the answer.

    Args:
        text: raw string produced by the thesis chain.

    Returns:
        The extracted answer as a string.
    """
    marker = "The correct answer is:"
    _, found, tail = text.partition(marker)
    if not found:
        # no marker: nothing to cut away, keep the full generation
        return text.strip()
    return tail.strip()

## 🔹 Test: how well does the thesis alone perform?

In [31]:
# Run the thesis step on every selected query and collect the extracted answers.
# Iterating with zip avoids the hard-coded query count; it stops at the shortest list
# (all four lists are sliced with the same [:50]).
answers = []
for query, true_answer, distractor_a, distractor_b in zip(
    first_queries, correct_answers, distractors_1, distractors_2
):
    print(f"True answer: {true_answer}")
    merged_options = shuffleAnswers(true_answer, distractor_a, distractor_b)
    # generate once and reuse the result: calling the chain a second time just to
    # print doubled the LLM work and could show a text different from the stored one
    given_answer = extract_answer(thesisGeneration(query, prompt_template, merged_options))
    answers.append(given_answer)
    print(f"Given answer: {given_answer}")
    print('****************')

True answer: ['Results-Based Accountability is a disciplined way of thinking and taking action that communities can use to improve the lives of children, youth, families, adults and the community as a whole.']




Given answer: Results-Based Accountability is a disciplined way of thinking and taking action that communities can use to improves the live...
****************
True answer: ['Yes']




Given answer: 'No'.
****************
True answer: ['20-25 minutes']




Given answer: '[2] Oatmeal, beans, apples, pears, barley and prunes."
****************
True answer: ['$11 to $22 per square foot']




Given answer: ["$11 to $22 per square foot"]
****************
True answer: ['Due to symptoms in the body']




Given answer: ["Due to symtions in the bod"]
****************
True answer: ['Inside the rib cage.']




Given answer: Inside the ribcage
****************
True answer: ['The most expensive patents are international patents, which can run up to $100,000 or higher.Domestically the costs can be $10,000 or above.']




Given answer: 'International patents tend to have more complex requirements than domestic ones because they involve multiple countries’ laws & regulations; therefore their fees may vary depending on each country involved (economies). Domestic applications usually require less work due fewer steps needed before approval – meaning lower overall expenses! So while both types could potentially result in high prices if not done right away without proper research/planning ahead–it makes sense that internationally issued documents might come at greater financial burden compared domestics'.
****************
True answer: []




Given answer: '[2] A light- colored  igneus rocks with graneslarge enoughto bvisible withe Unaied Eye'.
****************
True answer: ['Sophocles, Aeschylus and Euripides']




Given answer: 'Euripidean Tragedy'.
****************
True answer: ['A tree or shrub which produces distinctive cones as part of its sexual reproduction.']




Given answer: ["Tree or shrub which produce distinctive cones".]
****************
True answer: ['Somatic cells are produced by mitosis and gametes produced by most organisms combine to form a zygote with n pairs of chromosomes.']




Given answer: Somatic cells are produced by mitosis and gametes produce bymostorganismscombineToformazygoWithnpairsOfChromsomese.]
****************
True answer: ['Dr. Seuss']




Given answer: Dr.Seus
****************
True answer: ['45 minutes to an hour']




Given answer: After completing a 4- year bachelorsdegreeprograminbiologysciencepre medorarelatedfieldaspiringsurgorthesurgeonshavetosuccessfullycompletefouradditionalyeartrainingaftergraduationandbecomemembersofanesteemedprofessionalscientistsphysiciansresearcherseducatorsengineersexpertswhoworktogethertoimprovehumanhealthandsafety
****************
True answer: ['$6-$16 a square foot']




Given answer: ["$6-$16 a square foot"]
****************
True answer: ['Granite.', 'Granite.']




Given answer: Granit
****************
True answer: ['$4.64 - $6.36']




Given answer: A) Geographical regions
****************
True answer: ['Fish']




Given answer: 'Fish'.
****************
True answer: ["In a New York State hermit's letter to the editor of an Adirondack Mountain newspaper."]




Given answer: A Searching Study Inquiry Or Inspectin
****************
True answer: ['A macintosh made from cotton fabric treated with oil and pigment to make it waterproof.']




Given answer: Oilskin fabric = A macintosh made from cotton fabric treated with oil and pigment to make it waterproof
****************
True answer: ['7 days before to 7 days after the rash appears']




Given answer: '7 days before to 7 days after the rash appear'.
****************
True answer: ['The Camerata are a group of four powerful and influential individuals in the city of Cloudbank. Established by Grant Kendrell and Royce Bracket, the group circumvents the official administration and democratic nature of Cloudbank, in order to establish some form of stability in the ever-changing city.']




Given answer: ["Established by Grant Kendraell and Royce Bratckett"].
****************
True answer: ['An hour to 1 hour 15 minutes.']




Given answer: An hour to 1 hour 15 minutes
****************
True answer: ['8 mg on the first day and 16 mg (the full dosage) on the second day.']




Given answer: 'Some patients may benefit from a higher dose'.
****************
True answer: ['$56,000']




Given answer: $24,421 per annun
****************
True answer: ['The Tet Offensive was a military campaign during the Vietnam War that began on January 31, 1968 by the forces of the National Liberation Front for South Vietnam. ']




Given answer: [" $50 - $150 or More"   ]
****************
True answer: []




Given answer: '[2] Yes'.
****************
True answer: ["Photosynthesis is a process used by plants and other organisms to convert light energy, normally from the Sun, into chemical energy that can be later released to fuel the organisms' activities."]




Given answer: " Photosynthesis uses sunlight as an Energy source"
****************
True answer: ['Capillaries.']




Given answer: They are proteins produced by B-lymphocytes (B-cells), cells of the immune system
****************
True answer: ['Rappelling is the process of coming down from a mountain that is usually done with two pieces of rope.']




Given answer: [[2]]
****************
True answer: ['They are the soldiers on the ground that Boost Beer Sales.Selling Beer is by far one of the most amazing jobs that any person can have.']




Given answer: From 97°F (36.1°C) to  99°F(37.2°C).
****************
True answer: ['An overnight stay for a keyhole surgery and three to five days stay for an open surgery.']




Given answer: An overnight stay for a keyhole surgery and three to five days stay for an open surgery.]
****************
True answer: ['65']




Given answer: ------------
  65
****************
True answer: ['$85 ($125.00 for a pair)']




Given answer: ["$85 ($125.00 for a pair)"]
****************
True answer: ["A complication of type 1 or type 2 diabetes caused by damage to the kidneys' delicate filtering system. "]




Given answer: A) Complications of Type I Diabetics
****************
True answer: ['James Madison made a great contribution by writing The federalist paper for the constitution of United states.']




Given answer: [" James Madision Made A Great Contribution By Writing Th Federalists Papers For Constitution Of Unites States"].
****************
True answer: ['160° F to 165° F.']




Given answer: '160°F to 165°F'.
****************
True answer: ['Advanced Mobile Phone System (AMPS) is an analog mobile cell phone system standard developed by Bell Labs, and officially introduced in the Americas on October 13, 1983, Israel in 1986, Australia in 1987, and Pakistan in 1990.']




Given answer: Advanced MobilePhoneSystem( AMPS).
****************
True answer: ['Homologous']




Given answer: Homologous
****************
True answer: ['$15,000 and $40,000']




Given answer: ["Under 5mg/dl"]
****************
True answer: ['5 percent of the unpaid taxes for each month']




Given answer: '5 percent of the unpaid taxes for each month'.
****************
True answer: ['In the quadratic formula, the expression under the square root sign, b 2 – 4 ac, is called the discriminant.']




Given answer: 'The Expression Under The Square Root Sign In The Quadratic Formula Is Called The Discrinatent'.
****************
True answer: ['Festive party']




Given answer: [[2]]
****************
True answer: ['Foxes, cats and birds.', 'A possum (plural form: possums) is any of about 70 small-to medium-sized arboreal marsupial species native to Australia, New Guinea, and Sulawesi (and introduced to New Zealand and China).']




Given answer: ["Possum"]
****************
True answer: ['It is basically of two types aerobic and anaerobic which may be obligate or facultative.']




Given answer: ["Anaerobe", "Obligate"]
****************
True answer: ['Monocytes are a type of white blood cells (leukocytes).']




Given answer: Monocytes are a type of white blood cell (Leucocyte)
****************
True answer: ['$50 and $200']




Given answer: Option A - "$50-$200"
****************
True answer: ['$37,000']




Given answer: $37,000
****************
True answer: ['bugs']




Given answer: 'Bugs'.
****************
True answer: ['It is the ritual ceremony of encounter.']




Given answer: 'It is the ritual ceremony of encounters'.
****************
True answer: ['Often refers to a man who is able to grow a corn-silk like beard.']




Given answer: Option B - Increase HDL Cholestrol
****************


In [20]:
answers

['[[7]] - gets from talk to action quickly',
 '["B"] Yes',
 "'Two days'.",
 '["For a medium-sized shower," "$11 to $22 per square foot"]',
 'Due to symtoms in the Body']

## 🔸 Pipeline for **antithesis** generation

In [16]:
# Text-generation pipeline used to produce the antithesis (the check of the first answer).
# Decoding is greedy (do_sample=False), so the sampling-only settings `temperature`
# and `top_p` are not passed: they have no effect without sampling and only
# trigger generation-config warnings.
response_check_pipeline = pipeline(
    model=model,
    tokenizer=tokenizer,
    task="text-generation",
    do_sample=False,
    repetition_penalty=1.5,
    # keep the prompt in the returned text
    # NOTE(review): `extract_answer_ant` searches the output for the prompt's closing marker —
    # confirm the LangChain wrapper does not strip the prompt
    return_full_text=True,
    max_new_tokens=400,
)

# LangChain wrapper so the pipeline can be used as the last step of a chain
response_check_llm = HuggingFacePipeline(pipeline=response_check_pipeline)

## 🔸 PromptTemplate definition and a LLMChain for the **antithesis** 

In [17]:
from langchain import PromptTemplate
# prompt template for the antithesis step
# requires question, option_a, option_b, option_c, candidate_answer and context as input variables
# NOTE: this rebinds the name `prompt_template`, which previously held the thesis template;
# `thesis_chain` was built from the earlier object before this reassignment
prompt_template = PromptTemplate.from_template(
"""
    You're a helpful assistant and you are asked to check whether or not a question was answered correctly, given a certain number of candidate options and the context. 
    Given this question: {question} \n 
    These are the possible options: {option_a}, {option_b}, {option_c} \n.
    The answer that you have to check is {candidate_answer}. 
    Here is context to help: {context} \n
    Answer by saying 'Yes' if it is correct and 'No' otherwise, then explain why you think so.
    Why or why not the answer is correct:
 """
)

In [18]:
# LLM chain definition

from langchain_core.runnables import RunnablePassthrough, RunnableParallel
from operator import itemgetter

# Each prompt placeholder is filled from the same-named key of the dict given to `invoke`.
augmentation = {
    field: itemgetter(field)
    for field in (
        "question",
        "option_a",
        "option_b",
        "option_c",
        "candidate_answer",
        "context",
    )
}

# input dict -> filled prompt -> LLM
antithesis_chain = augmentation | prompt_template | response_check_llm

## 🔸 Function to generate the antithesis given the question, the thesis, the context and the options

In [19]:
def antithesisGeneration(query, prompt_template, merged, candidate_answer):
    """
    Retrieve context for `query` and ask the antithesis chain to judge a candidate answer.

    Args:
        query: the question; used both for retrieval and to fill the prompt.
        prompt_template: accepted but not read here; the module-level
            `antithesis_chain` is invoked as it is.
        merged: sequence whose first three items fill option_a, option_b, option_c.
        candidate_answer: the answer to be checked.

    Returns:
        Whatever `antithesis_chain.invoke` returns for the assembled inputs.
    """
    context_block = format_page_content(retriever.invoke(query))

    chain_inputs = {
        'question': query,
        'option_a': merged[0],
        'option_b': merged[1],
        'option_c': merged[2],
        'candidate_answer': candidate_answer,
        'context': context_block,
    }
    return antithesis_chain.invoke(chain_inputs)

In [20]:
def extract_answer_ant(text):
    """Return the part of `text` that follows the antithesis prompt marker.

    The marker is the literal "Why or why not the answer is correct:"; only its
    first occurrence is considered. Surrounding whitespace is stripped from the
    extracted text.

    Args:
        text: String to search.

    Returns:
        The stripped text after the marker, or the sentinel
        "The correct answer could not be found." when the marker is absent.
    """
    marker = "Why or why not the answer is correct:"
    # partition splits at the first occurrence; `found` is empty when there is none.
    _, found, remainder = text.partition(marker)
    if not found:
        return "The correct answer could not be found."
    return remainder.strip()

In [32]:
# Generate the antithesis (critique) for the first 50 examples.
# The chain is invoked exactly once per example: the stored critique is the one
# that gets printed, so the log always matches `ant_answers` and the retriever/LLM
# work is not repeated just for printing.
ant_answers = []
for i in range(50):
    print(f"True answer: {correct_answers[i]}")
    merged_options = shuffleAnswers(correct_answers[i], distractors_1[i], distractors_2[i])
    ant_answers.append(
        extract_answer_ant(
            antithesisGeneration(first_queries[i], prompt_template, merged_options, answers[i])
        )
    )
    # Print the value that was just stored instead of generating a second one.
    print(f"Given answer: {ant_answers[-1]}")
    print('****************')

True answer: ['Results-Based Accountability is a disciplined way of thinking and taking action that communities can use to improve the lives of children, youth, families, adults and the community as a whole.']




Given answer: Yes - This option matches exactly how results based accountability (RBA) works according to their website description provided above. It clearly states they provide services for businesses such as developing strategies,designing technologies etc...to create better user experience through provable techno logy engineeering methods
****************
True answer: ['Yes']




Given answer: No - This option should be marked as incorrect because according to provided text in prompt "Ronaldo Reagen" has been described as liberal republican who supports another Democratic presidential nominee Jerry Fords
****************
True answer: ['20-25 minutes']




Given answer: I would say "no". Although there may exist some places in Sydney with those ingredients available within an hour delivery time frame (either through farmers markets/CSAs), most likely these items will take longer than just oats & rice as they require more preparation times such cooking methods like boiling water etc., thus making their availability much less convenient compared other staple food groups found locally nearer locations including supermarkets which offer quick accessibility without having go further afield searching out specific products needed daily meals planning purposes - especially when considering factors related travel distance between desired location(ies) versus actual proximity oneself home kitchen environment!
****************
True answer: ['$11 to $22 per square foot']




Given answer: Yes - This option matches what we know from our research on how much does it costs for installing tiles in bathroom which states "The average range for labor only (not including material) runs between around $8-$15 dollars an hour." So based off these numbers its likely they would charge anywhere within those ranges depending on location size complexity etcetera
****************
True answer: ['Due to symptoms in the body']




Given answer: Yes - This option matches what we know about conversions from human physiology class notes; when there is damage done inside our bodies (symptom) something can change within us which causes changes outside as well such as weight gain etc... So yes indeed!
****************
True answer: ['Inside the rib cage.']




Given answer: Yes - This option matches what I found when researching online about lung location! According to my search results (<https://www.healthline.com/human-body-organs/where-are-the-lungs>), "The lungs are located inside your chest cavity." So yes indeed they do reside INSIDE THE RIB CAGE!"
****************
True answer: ['The most expensive patents are international patents, which can run up to $100,000 or higher.Domestically the costs can be $10,000 or above.']




Given answer: Yes - This option answers accurately reflects what I found during my search for information about how much does one need pay when applying through WIPRnet portal tool provided earlier today. Accordingly, International applicants must contend with additional legal hurdles such as translations into various languages required per treaty law governing these agreements between nations whereas those filing only within single nation do no face similar obstacles resulting increased complexity leading toward larger price tags associated w/.
****************
True answer: []




Given answer: This option refers tp marble -a type o fmetamorphicrock formed through recrystallization process after limestone has been subjecte dto high pressure an temperature conditions over millions years. Marbles arent related too anythin grelated topatient s experiencing sexual issues such as pre matures ejacuation ot impo tenance, nor do thay provide information about patient cultural backgrounds
****************
True answer: ['Sophocles, Aeschylus and Euripides']




Given answer: Yes - This option refers specifically to plays written in Athens during the late Archaic period (c.5th century BCE) which were characterized as having complex plots with multiple reversals involving gods interfering directly on human affairs; these features distinguish them from earlier forms such as choral songs & dithyrambs performed at religious festivals like Dionysia where mythological stories about heroes past dominated stage performances without necessarily adherence to strict dramatic conventions established later for tragedia/tragedie proper under Aristotle’s influence after his time had passed since Sophoklēs first wrote Antigone around c.478-469BCE.]
****************
True answer: ['A tree or shrub which produces distinctive cones as part of its sexual reproduction.']




Given answer: Yes - This option matches exactly with definition provided in text "Conifer refers to any plant belonging to division Pinophyta (or Coniferae) within kingdom Plantae" from source Wikipedia(dot com). It also mentions how important identifying these plants can be especially when trying identify them based off their reproductive structures like cone production
****************
True answer: ['Somatic cells are produced by mitosis and gametes produced by most organisms combine to form a zygote with n pairs of chromosomes.']




Given answer: Yes - This option matches exactly what we were looking for! "In zoologymostanimalsproducesomecellsbymitosesandothersbythough process called meiosis" which resultsin46orlesspairofchromossmes(gamets)combiningtoforzygotewith23pairsofcahrmssoneverytimeasexual reproductionoccurs..Thisanswerscorrectlyrefefrstoanimal cell division anatomy.
****************
True answer: ['Dr. Seuss']




Given answer: Yes - This option matches what we know about dr seuess as an Author.He did write "The Cat Inhat" which makes him eligible for being remembered among other authors mentioned here
****************
True answer: ['45 minutes to an hour']




Given answer: No because "the Big Easy" refers specifically to New Orleans cuisine which typically involves slow braising meats rather than quick frying them like what would happen with oven roasting for example. So while technically true, your statement doesnot accurately reflect typical usage associated w/this term within culinary culture at large & therefore cannot serveascorrectresponsewhenaskedsuchquestionbyassistant
****************
True answer: ['$6-$16 a square foot']




Given answer: Yes - This option matches what we know about costs associated with installing flooring systems like radiant heat mats (RHMs) which provide warmth through conduction rather than convective methods such as baseboard radiation found more commonly under sinks near water pipes etcetera; these types tend towards higher upfront expenses but lower long-term operating ones due primarily because they don’t require ducted HVAC setups – just plug them into existing electrical outlets! Additionally there may be local regulations governing placement/installation requirements depending where one lives & works at home too...so keep those things mind when deciding how much money will go toward each step before moving forward w any particular choice here today tomorrow next week month year whatever time frame makes sense most logically speaking practicably feasibly affordable sustainability wise all around without breaking bank account balance sheet ledger bookkeeping records receipts bill



Given answer: Yes - This option has been selected because "made up" does indeed refer back to Basalts which means Mount Pinotobos must necessarily also consist mainly of those minerals since they were both created from volcanic activity at around same time period
****************
True answer: ['$4.64 - $6.36']




Given answer: Yes! This option matches what we were told in the passage about how using concrete instead of wood can save money because prices for these materials vary greatly depending where they come from (geographically). So when someone says something like “concrete pads” without specifying location – assuming those words refer solely towards physical structures made outta cement–then logically speaking there should exist different price ranges associated w/these products based upon their respective locations around world; thus making choice C most likely accurate one here since cheaper alternatives tend toward being found closer rather than farther away…
****************
True answer: ['Fish']




Given answer: Yes - This option refers directly back to "organisms" which includes both plants AND animals including Fish...so yes they did refer to something related to biology/zoo-logical science within those lines!
****************
True answer: ["In a New York State hermit's letter to the editor of an Adirondack Mountain newspaper."]




Given answer: Yes - This option matches best with "It Is What It IS" which means looking deeply into something without any preconception about its nature; examining things closely for their true character rather than just superficially judging them based on appearances alone
****************
True answer: ['A macintosh made from cotton fabric treated with oil and pigment to make it waterproof.']




Given answer: Yes! I would say yes because based on how oilskin fabrics work its definitely true for them too be described as being made form cottene fabric treatd wit hthe additiona ot an oil sndpiment tto mka eitr watetproof. Thiis ias bcas thhey do nt llet wtaer paass throuhg he fbscic, whihc iss ytehow theeo ilfoskln faabriics worlks..
****************
True answer: ['7 days before to 7 days after the rash appears']




Given answer: Yes - because option A matches what we know about German Measels being highly infectuous during its incubation period (the time from exposure to when symptoms show up). During these seven day window either side of appearance any person who has been exposed could potentially spread germs through contact with others
****************
True answer: ['The Camerata are a group of four powerful and influential individuals in the city of Cloudbank. Established by Grant Kendrell and Royce Bracket, the group circumvents the official administration and democratic nature of Cloudbank, in order to establish some form of stability in the ever-changing city.']




Given answer: Yes - This option matches exactly with how "camereta" appears throughout the text provided as reference; specifically when referring to an organization established within cloudbanks society/governmental structure rather than any other definition related to photography equipment such storing sugar salt solutions etcetera
****************
True answer: ['An hour to 1 hour 15 minutes.']




Given answer: No because according to what SonnyBoy said he has made Pound Cakes before which would mean his experience contradicts with option A) Yes
****************
True answer: ['8 mg on the first day and 16 mg (the full dosage) on the second day.']




Given answer: I would say "yes" because option B states exactly how much Suboxone some people might need for their specific situation according to clinical trials data cited at reference #[1]. This information aligns with medical professionals who prescribe medication based upon individual patient needs rather than adhering rigidly onto standardized protocols without considering each person unique circumstances which could require different treatment plans tailored towards achieving optimal results while minimizing potential risks associated therewith thus making Option A incorrect choice since its sole focus lies within fixed guidelines only applicable under limited scenarios whereas Options C & D provide no relevant details regarding therapeutic applications nor any scientific backing up those claims leaving them unsuitable choices overall leading us toward selecting Only Choice B being medically sound advice supported through reliable sources
****************
True answer: ['$56,000'



Given answer: I would say yes because option ($24,421perannum) matches what they said "the average annual wage for players on teams with similar performance" which means its related directly from their statement
****************
True answer: ['The Tet Offensive was a military campaign during the Vietnam War that began on January 31, 1968 by the forces of the National Liberation Front for South Vietnam. ']




Given answer: Yes! This option matches exactly with one part of the text provided "TET". It says "$50-$$150 OR MORE", which means any amount above those two numbers would match the phrase mentioned earlier (in bold).
****************
True answer: []




Given answer: I agree with your assessment; option (3) "yes" corresponds accurately because according to what has been provided in the passage about how an action potential travels down its length within myelinated neurons via electrical signals transmitted from one end at resting membrane voltage called threshold potential which exceeded during depolarization causing opening sodium channels allowing positively charged ion rush into cell resulting rapid change in electric field across plasma membranes leading eventually back inside for transmission elsewhere else throughout nervous system without any further processing required due solely on passive diffusion mechanisms already built-in place there beforehand thus confirmation choice three indeed reflect true nature information presented here above all other possibilities seem unlikely plausible choices based upon text alone
****************
True answer: ["Photosynthesis is a process used by plants and other organisms to convert light 



Given answer: Yes - This option accurately reflects how much energy is required for photosynthesis because they use solar radiation (sun) as their primary power supply during production processes like carbon fixation & ATP synthesis within chloroplast cells found mostly inside plant leaves; thus making them dependent solely upon available amounts captured via absorption mechanics rather anything else!
****************
True answer: ['Capillaries.']




Given answer: Yes - This option matches what I read from my textbook about how small capillary veinous blood vessels found throughout our bodies where gases like oxygen & carbon dioxide get exchanged between them through diffusion process which helps maintain homeostasis within human beings!
****************
True answer: ['Rappelling is the process of coming down from a mountain that is usually done with two pieces of rope.']




Given answer: No, I don't agree because there isn't any information about Rappeling being related to Illa (the arabic language).
****************
True answer: ['They are the soldiers on the ground that Boost Beer Sales.Selling Beer is by far one of the most amazing jobs that any person can have.']




Given answer: Yes - This option matches exactly with how a Brewery Representative would act in real life as they work tirelessly from Monday through Sunday selling their product while ensuring proper temperature control between 97-degrees Fahrenheit all throughout those seven days!
****************
True answer: ['An overnight stay for a keyhole surgery and three to five days stay for an open surgery.']




Given answer: Yes - This option matches what Dr said "will stay in the Hospital any where form Three To Five Days" which means they would need at least one nights rest before leaving the medical facility making them eligible as first choice among all other choices provided here
****************
True answer: ['65']




Given answer: No because "Medicare begins" doesn't necessarily mean when someone turns 65 years old but rather when they become eligible for coverage under the program which typically occurs after reaching Age 65 as per US government rules & regulations
****************
True answer: ['$85 ($125.00 for a pair)']




Given answer: Yes - This option matches one part of the text "Adoptioin fee". It says "$85 (or $125.00 for a pair)." So yes!
****************
True answer: ["A complication of type 1 or type 2 diabetes caused by damage to the kidneys' delicate filtering system. "]




Given answer: Yes - This option matches exactly with how we define nephropathy in medical terms which means any kind of disease affecting the structure/functionality of renal tissues (kidnies). In other words Nephrologists diagnose & treat disorders related specifically to those organs including chronic diseases like DN(diabetic neuropthy), CKD(Chronic Kidney Disese), etc... So Option B fits perfectly well within its definition!
****************
True answer: ['James Madison made a great contribution by writing The federalist paper for the constitution of United states.']




Given answer: Yes - This option matches what we know about JamesMadisons role in creatingthe USConstitution based on historical records. He did write extensive Notes during convention proceedings,and his contributions were instrumentalin shaping thesociety governance structure aswe knoWit today
****************
True answer: ['160° F to 165° F.']




Given answer: Yes - This option matches exactly with one part in the text where they say "Meat needs to reach an internal temperature between 145-degree fahrenheit (or higher)". So yes! It has been confirmed as being accurate from our source material provided herein above; thus making choice #2 – “160 degree(s).”
****************
True answer: ['Advanced Mobile Phone System (AMPS) is an analog mobile cell phone system standard developed by Bell Labs, and officially introduced in the Americas on October 13, 1983, Israel in 1986, Australia in 1987, and Pakistan in 1990.']




Given answer: Yes - This option matches exactly with one sentence from provided text "Analog mobile phones use radio frequencies similar as those used for home telephone service". It also mentions year when technology first came out which aligns well too
****************
True answer: ['Homologous']




Given answer: Yes - This option matches what we know about homology based upon our understanding of genetics today; specifically how proteins with different functions may still contain some degree of similarity due their shared evolutionary history (i.e., they "share structural similitudes" which suggests an origin through descent). Therefore selecting Option A would indicate knowledge related field!
****************
True answer: ['$15,000 and $40,000']




Given answer: Yes - This option matches what I found when researching on Google about how much does Solar Panel Cost? According to several sources including EnergySage (https://www.energysage.com/),the national average price range per watt ranges from between $2.87-$3.95 with an installed total system ranging around $15k+ depending upon location size roof orientation etc... So yes "under 5mgs" would be considered accurate based off current market data available online today!
****************
True answer: ['5 percent of the unpaid taxes for each month']




Given answer: Yes - This option matches what IRS does assess as penalties/fee for failure to make timely Payment Of Tax Liability. According To (IRS) Instructions For Form 4868, If Individual Does Not Make Timely Election And Pays At Least Half Of Their Unpaid T ax By April  15th Then No Penalty Will Be Assessed On That Particular Year But FailureTo File Or Making LatePayments Can Still Result In Additional Charged Such As Delinquency Fee & Interest Charge Which Are Calculated BasedOn Time Frame Since Last Pa ym ent Was Due
****************
True answer: ['In the quadratic formula, the expression under the square root sign, b 2 – 4 ac, is called the discriminant.']




Given answer: Yes! This option matches exactly with definition provided in text passage at point (]. It states clearly that “the discovery of the disscrinant” which means the expresion uder teh squareroot sgnn IS CALLED THE DISCRIMINANT"
****************
True answer: ['Festive party']




Given answer: No, I don’t agree with your response because option[3]" Festive Party" does NOT mean what they said! It actually refers to something completely different than their stated definition for “Gayle” which has nothing related festivity at all but instead pertained too gene regulation within cellular biology specifically involving Homeo domain proteins binding onto DNA sequences called Hoxgenes/homebox genes found primarily throughout animal kingdom including humans where these particular set rules govern how cells differentiate into tissues organ systems etc.. So while Option three may seem like relevant information regarding another topic altogether entirely unrelated questions about names origination definitions purposes cultural significance anything else associated therein – none Of those things relate back towards answering original query here thus making choice incorrect selection among available choices offered up front again resulting opposite conclusion compared mine 



Given answer: Yes - Posum refers specifically to one type of Australian mammals in which there exist multiple members including Brush tail opossum among others hence making "posums" an appropriate term for referring collectively these animals rather than just using singular terms like foxes,cats etc.
****************
True answer: ['It is basically of two types aerobic and anaerobic which may be obligate or facultative.']




Given answer: No - This option does not match with what has been said about how some microorganisms breathe because while both terms do refer to ways for them to get energy from their food sources (either through oxygen use as opposed to without), only one refers specifically to those organism being unable to survive outside environments containing O2 whereas other can live even when exposed directly too much air including nitrogen dioxide etc.. Therefore we should choose Option B instead!
****************
True answer: ['Monocytes are a type of white blood cells (leukocytes).']




Given answer: Yes! That option matches with definition provided in reference text which states "monocytes...is a constitute part of Endotheelic Inter Cell Juntion" meaning they play role as immune system component helping protect body from harmful pathogens like bacteria viruses fungi etcetera
****************
True answer: ['$50 and $200']




Given answer: Yes! This option matches what we read from the text passage provided above when discusses about how much an Interior Decorators charge their clients based on time spent working at each project site; hence they can be paid anywhere within those two ranges ($50 – $200).
****************
True answer: ['$37,000']




Given answer: Yes - This option matches what I found during my research on national averages across different sources including but not limited to Bureau Labor Statistics (BLS) data as well as professional organizations such as Association Of Children’s Museum Directors International(ACMDI). Accordingly,the median wage nationwide would be around thirty seven thousand dollars per year.So yes! That one seems like an accurate choice among those provided here today!
****************
True answer: ['bugs']




Given answer: Yes - This option matches what I found in my research on how do scorpion naturally die/kill themselves without human intervention which includes being eaten alive from inside out (by bugs).
****************
True answer: ['It is the ritual ceremony of encounter.']




Given answer: Yes - This option matches exactly one instance wherein Powhiri means Ritual Ceremony Of Encounter as per provided reference link from Merrian-Webster Dictionary which clearly defines its meanings under different categories like definition at sense level, usage examples etc... Therefore we can confidently mark ( It Is Arital Cermony Ofeencounter)as thesolution forthis particular qustion.
****************
True answer: ['Often refers to a man who is able to grow a corn-silk like beard.']




Given answer: Yes! This option matches what we know about being a burly person based on our understanding from text definition provided earlier; increasing one’s good/high density lipoprotein(hdl), also known as ‘Good Cholesteal’ can make them more healthy overall because hdls helps remove excess bad ldl through reverse transportation process which reduces risk factors for heart disease & stroke among other benefits thus making him look better than before while still maintaining their unique style choices without any fear nor shame attached with growing an impressive silky long hair all over body parts including face just right above upper lip area where facial features meet cheeks giving off impression they could easily pass muster at most prestigious gentleman clubs around town should anyone ever doubted authenticity thereof due solely upon appearance alone since these men already possess natural talent when comes grooming themselves into looking dashingly handsome even though some m

In [22]:
# Display the collected critiques (one extracted string per processed example).
# NOTE(review): this cell's execution count (22) is lower than that of the loop cell
# that fills `ant_answers` (32), so the saved output may come from a different run
# than the loop output printed above.
ant_answers

['Yes - This option matches exactly how I understand from my reading comprehension skills training course on Udemy where they define results based accounting (RBA)as; A methodology for measuring performance outcomes against predefined goals set within an organization using data analytics tools such as dashboards visualizations reports etcetera. It also involves setting up metrics tracking systems monitoring key indicators identifying areas need improvement implementing changes accordingly ensures continuous improvements towards achieving desired objectives while maintaining transparency throughout entire process thus enabling informed decision making across departments teams stakeholders alike!',
 'No - This option should be marked as incorrect because according to provided text in prompt "Ronaldo Reagen" has been described as liberal republican who supports another Democratic presidential nominee Jerry Fords',
 'Nope! Unfortunately "Surrounding Areas Of Sydney" does include many other

## 🔺 Pipeline for **synthesis** generation

In [23]:
# Text-generation pipeline intended for the synthesis step, built on the same
# `model` and `tokenizer` objects.
final_response_pipeline = pipeline(
    task="text-generation",
    model=model,
    tokenizer=tokenizer,
    # Decoding: sampling is switched off.
    # NOTE(review): with do_sample=False, temperature/top_p are presumably not used
    # by generation - confirm against the installed transformers version.
    do_sample=False,
    temperature=0.0,
    top_p=0.0,
    repetition_penalty=1.5,
    # Upper bound on the number of newly generated tokens.
    max_new_tokens=400,
    # The returned text contains the prompt followed by the generation.
    return_full_text=True,
)

# LangChain wrapper around the pipeline so it can be used as a chain stage.
final_response_llm = HuggingFacePipeline(pipeline=final_response_pipeline)

## 🔺 PromptTemplate definition and an LLMChain for the **synthesis**

In [24]:
from langchain import PromptTemplate
# Prompt for the synthesis step.
# Template variables: question, option_a, option_b, option_c, candidate_answer,
# critique, context.
# This rebinds the name `prompt_template`, which earlier held the antithesis prompt;
# `antithesis_chain` keeps the template object it was constructed with.
# The closing line "The answer is:" is the marker that `extract_answer_syn` searches for.
prompt_template = PromptTemplate.from_template(
"""
    You're a helpful assistant and you are asked to answer a certain question, given a certain number of candidate options and the context.
    You are also provided with an initial response and its critique, that could enforce or not the first opinion.
    Make a reasonable synthesis of these two opinions, but answer by outputting exactly one of the answer options only.
    Given this question: {question} \n 
    These are the possible options: {option_a}, {option_b}, {option_c} \n.
    The answer that you have to check is {candidate_answer} and this is its critique: {critique}.
    Here is context to help: {context} \n
    The answer is:
 """
)

In [25]:
# LLM chain definition

from langchain_core.runnables import RunnablePassthrough, RunnableParallel
from operator import itemgetter

# Input mapping for the synthesis prompt: every template variable (including the
# critique produced by the antithesis step) is read, under the same name, from the
# dict handed to `synthesis_chain.invoke`.
augmentation = {
    field: itemgetter(field)
    for field in (
        "question",
        "option_a",
        "option_b",
        "option_c",
        "candidate_answer",
        "critique",
        "context",
    )
}

# The synthesis step has its own LLM wrapper, `final_response_llm`, built from
# `final_response_pipeline`. The chain previously ended in `response_check_llm`
# (the antithesis model wrapper), which left `final_response_llm` unused.
synthesis_chain = augmentation | prompt_template | final_response_llm

## 🔺 Function to generate the synthesis given the question, the options, the thesis, its critique (antithesis) and the context

In [26]:
def synthesisGeneration(query, prompt_template, merged, candidate_answer, critique):
    """Run the synthesis chain and return its raw output.

    Documents are fetched for `query` with the module-level `retriever`, turned
    into a context string by `format_page_content`, and passed to
    `synthesis_chain` together with the question, the options, the candidate
    answer and its critique.

    Args:
        query: The question; also used as the retrieval query.
        prompt_template: Not used inside the function; kept so existing calls
            keep working.
        merged: Indexable whose items 0, 1 and 2 are the three answer options.
        candidate_answer: The initial answer being reconsidered.
        critique: The critique of `candidate_answer`.

    Returns:
        Whatever `synthesis_chain.invoke` returns.
    """
    context = format_page_content(retriever.invoke(query))

    chain_input = {
        'question': query,
        'option_a': merged[0],
        'option_b': merged[1],
        'option_c': merged[2],
        'candidate_answer': candidate_answer,
        'critique': critique,
        'context': context,
    }
    return synthesis_chain.invoke(chain_input)

In [27]:
def extract_answer_syn(text):
    """Return the answer that follows the "The answer is:" marker in ``text``.

    The first occurrence of the marker is used, and everything after it is
    returned with surrounding whitespace stripped. The marker itself is not
    part of the result.

    Args:
        text: Full text produced by the synthesis chain (string).

    Returns:
        The stripped text after the marker (possibly an empty string when
        nothing follows it), or "The correct answer could not be found." when
        the marker does not occur in ``text``.
    """
    marker = "The answer is:"

    # Locate where the marker starts.
    start_index = text.find(marker)
    if start_index == -1:
        return "The correct answer could not be found."

    # Skip past the marker so only the answer itself is returned.
    return text[start_index + len(marker):].strip()

In [33]:
# Number of examples to run through the synthesis step.
num_examples = 50

syn_answers = []
for i in range(num_examples):
    print(f"True answer: {correct_answers[i]}")
    merged_options = shuffleAnswers(correct_answers[i], distractors_1[i], distractors_2[i])

    # Run retrieval + generation once per example and reuse the result for both
    # storing and printing. Calling synthesisGeneration twice doubles the cost
    # and does not guarantee that the printed answer is the stored one.
    syn_answer = extract_answer_syn(
        synthesisGeneration(first_queries[i], prompt_template, merged_options, answers[i], ant_answers[i])
    )
    syn_answers.append(syn_answer)

    print(f"Given answer: {syn_answer}")
    print('****************')

True answer: ['Results-Based Accountability is a disciplined way of thinking and taking action that communities can use to improve the lives of children, youth, families, adults and the community as a whole.']




Given answer: The answer is:
  'Results-Based Accountability is a disciplined way of thinking and taking action that communities can use to improved the lived of childrens', Youth,familys,'and other individuals'.
****************
True answer: ['Yes']




Given answer: The answer is:
  NO
****************
True answer: ['20-25 minutes']




Given answer: The answer is:
 
     * Option A: No
****************
True answer: ['$11 to $22 per square foot']




Given answer: The answer is:
  "$11 to $22 per square foot"
****************
True answer: ['Due to symptoms in the body']




Given answer: The answer is:
  Due to Symtons in th Body
****************
True answer: ['Inside the rib cage.']




Given answer: The answer is:
  * Internal structure of human body organs
****************
True answer: ['The most expensive patents are international patents, which can run up to $100,000 or higher.Domestically the costs can be $10,000 or above.']




Given answer: The answer is:
  "international patents tends to have more complicated requirement"
****************
True answer: []




Given answer: The answer is:
  [[2]] A Light Colored Igneous Rock With Grains Large Enough To Be Visible Without Any aid
****************
True answer: ['Sophocles, Aeschylus and Euripides']




Given answer: The answer is:
  "best tragedies" -> Euripedean Tragedy
****************
True answer: ['A tree or shrub which produces distinctive cones as part of its sexual reproduction.']




Given answer: The answer is:
  Tree or shrub which producers distinguishable cones
****************
True answer: ['Somatic cells are produced by mitosis and gametes produced by most organisms combine to form a zygote with n pairs of chromosomes.']




Given answer: The answer is:
  Somatic cellsare producedybymitosisandaverageof80trillionhumanbodycelldivideeveryhoursometimequickernormalfunctionstakeplacewithouthavingtotakemuchnotice.Growthdevelopmentrepairmaintenancerequirethesupportofthe entire bodyincludingitsorgansandsystsemswhichtogetherconstitutes animmalcalledindividual
****************
True answer: ['Dr. Seuss']




Given answer: The answer is:
  'Dr.Seu...'.
****************
True answer: ['45 minutes to an hour']




Given answer: The answer is:
  * Herb (This option aligns best with both statements)
****************
True answer: ['$6-$16 a square foot']




Given answer: The answer is:
  "$6-$16 a square foot"
****************
True answer: ['Granite.', 'Granite.']




Given answer: The answer is:
  * Granito
****************
True answer: ['$4.64 - $6.36']




Given answer: The answer is:
  * Concrete Pads Cost ($4.64-$6.36): This information does seem quite relevant considering it was mentioned earlier as part of our discussion regarding why people might choose between wooden vs concrete slabs during construction projects involving residential properties located within specific areas across globe such us North America versus Europe etc... However I must point out some inconsistencies present throughout your argument which makes me lean slightly against selecting Option B at face value alone. First off, while true enough taht locality matters significantly impacting material pricing structure globally due t differences i n transportation & labor requirements among other factors --there exists no single universally accepted definition o f ‘Geography’ nor any standardized methodology fo r quantifying same acrross diverse disciplines including Economics Business Studies Environmental Science Political Scieces Anthroplogy Archeaolgy Ecteteras.. 



Given answer: The answer is:
  FISH
****************
True answer: ["In a New York State hermit's letter to the editor of an Adirondack Mountain newspaper."]




Given answer: The answer is:
  * 'Searching Study', because they both mean look at thing very carefully so as understand there real meaning
****************
True answer: ['A macintosh made from cotton fabric treated with oil and pigment to make it waterproof.']




Given answer: The answer is:
  *Oilskin fabric*
****************
True answer: ['7 days before to 7 days after the rash appears']




Given answer: The answer is:
 7 Days Before To 7 Day After Rash Appears
****************
True answer: ['The Camerata are a group of four powerful and influential individuals in the city of Cloudbank. Established by Grant Kendrell and Royce Bracket, the group circumvents the official administration and democratic nature of Cloudbank, in order to establish some form of stability in the ever-changing city.']




Given answer: The answer is:
  ••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••••
****************
True answer: ['An hour to 1 hour 15 minutes.']




Given answer: The answer is:
  * 'Answers': {
      'Option A): Peking Duck Eggs Are Kept In Setters For 25 Days And Then Transferred To Hatchers Until They Hatch On Day 28": false}, // This should be true since peking ducks don’t exist! So there can’t possibly been any such thing as “setlers” either.,
      
     }
****************
True answer: ['8 mg on the first day and 16 mg (the full dosage) on the second day.']




Given answer: The answer is:
  One week to 10 days
****************
True answer: ['$56,000']




Given answer: The answer is:
  $$24,421\text{ per year} \checkmark$$
****************
True answer: ['The Tet Offensive was a military campaign during the Vietnam War that began on January 31, 1968 by the forces of the National Liberation Front for South Vietnam. ']




Given answer: The answer is:
  $$50 – $150 Or More
****************
True answer: []




Given answer: The answer is:
  ------------
     | Option #| Description/Critique   | My Answer Choice#_ _______|
     1 | [] No | Not relevant since it doesn’t mention anything related directly nor indirectly regarding neurotransmitters release process mentioned later below when discussing synapses formation between pre & post –synaptic sites after receiving sensory input signal received then processed accordingly until reaching spinal cord where specific receptors bind particular chemical messengers known transmitter substances like acetylcholine released locally following binding causes muscle contraction effector organ respondents appropriates actions taken depending stimulus intensity duration etcetera…                           
      2 | ["Yes"] Knew as land hattis inhabitants were hittttes | This description seems accurate considering historical records showing presence ancient civilizations around world named lands settled various ethnic groups including those referred histori



Given answer: The answer is:
 
      * Photo Synthese Is A Process Used By Plants And Other Organism To Convert Light Energhy...*
****************
True answer: ['Capillaries.']




Given answer: The answer is:
  THEY ARE PROTEINS PRODUCED BY B-LYMPHOCYTES (B CELLS).
****************
True answer: ['Rappelling is the process of coming down from a mountain that is usually done with two pieces of rope.']




Given answer: The answer is:
 0] Rap-pellinG IS THE PROCESS OF COMING DOWN FROM A MOUNTAIN THAT USUALLY DOES WITH TWO PIECES ROPE
****************
True answer: ['They are the soldiers on the ground that Boost Beer Sales.Selling Beer is by far one of the most amazing jobs that any person can have.']




Given answer: The answer is:
  * 'From 97°F (36.1°C) to 99°F (37.2°C)'
****************
True answer: ['An overnight stay for a keyhole surgery and three to five days stay for an open surgery.']




Given answer: The answer is:
  * Overnight Stay (3-5days)
****************
True answer: ['65']




Given answer: The answer is:
  *['65'])
****************
True answer: ['$85 ($125.00 for a pair)']




Given answer: The answer is:
 
     Answer:["$85 ($125.00 for a pair)"]
****************
True answer: ["A complication of type 1 or type 2 diabetes caused by damage to the kidneys' delicate filtering system. "]




Given answer: The answer is:
  *Option* A : **Complications** of **Type I Diabetis**
****************
True answer: ['James Madison made a great contribution by writing The federalist paper for the constitution of United states.']




Given answer: The answer is:
****************
True answer: ['160° F to 165° F.']




Given answer: The answer is:
  * 160°F to 165°F
****************
True answer: ['Advanced Mobile Phone System (AMPS) is an analog mobile cell phone system standard developed by Bell Labs, and officially introduced in the Americas on October 13, 1983, Israel in 1986, Australia in 1987, and Pakistan in 1990.']




Given answer: The answer is:
  * AdvanceMobilePhonE Systems
****************
True answer: ['Homologous']




Given answer: The answer is:
  Homologous
****************
True answer: ['$15,000 and $40,000']




Given answer: The answer is:
  Under 5mg/dl
****************
True answer: ['5 percent of the unpaid taxes for each month']




Given answer: The answer is:
 5%ofunpaiddtaxesformonthismonth
****************
True answer: ['In the quadratic formula, the expression under the square root sign, b 2 – 4 ac, is called the discriminant.']




Given answer: The answer is:
****************
True answer: ['Festive party']




Given answer: The answer is:
  [[2]].
****************
True answer: ['Foxes, cats and birds.', 'A possum (plural form: possums) is any of about 70 small-to medium-sized arboreal marsupial species native to Australia, New Guinea, and Sulawesi (and introduced to New Zealand and China).']




Given answer: The answer is:
  * Possum
****************
True answer: ['It is basically of two types aerobic and anaerobic which may be obligate or facultative.']




Given answer: The answer is:
  Anaerobe
****************
True answer: ['Monocytes are a type of white blood cells (leukocytes).']




Given answer: The answer is:
  Monocytes are a type of white blood cell called leucytesss
****************
True answer: ['$50 and $200']




Given answer: The answer is:
  $$50–$$200
****************
True answer: ['$37,000']




Given answer: The answer is:
  $37,000
****************
True answer: ['bugs']




Given answer: The answer is:
  Bugs
****************
True answer: ['It is the ritual ceremony of encounter.']




Given answer: The answer is:
  * It is the ritual ceremony of encounters
****************
True answer: ['Often refers to a man who is able to grow a corn-silk like beard.']




Given answer: The answer is:
 
Option B :IncreasesHDLCholelsterol
****************


In [34]:
# Display the collected synthesis answers (one string per evaluated example).
syn_answers

["The answer is:\n  'Results-Based Accountability is a disciplined way of thinking and taking action that communities can use to improved the lived of childrens', Youth,familys,'and other individuals'.",
 'The answer is:\n  NO',
 'The answer is:\n \n     * Option A: No',
 'The answer is:\n  "$11 to $22 per square foot"',
 'The answer is:\n  Due to Symtons in th Body',
 'The answer is:\n  * Internal structure of human body organs',
 'The answer is:\n  "international patents tends to have more complicated requirement"',
 'The answer is:\n  [[2]] A Light Colored Igneous Rock With Grains Large Enough To Be Visible Without Any aid',
 'The answer is:\n  "best tragedies" -> Euripedean Tragedy',
 'The answer is:\n  Tree or shrub which producers distinguishable cones',
 'The answer is:\n  Somatic cellsare producedybymitosisandaverageof80trillionhumanbodycelldivideeveryhoursometimequickernormalfunctionstakeplacewithouthavingtotakemuchnotice.Growthdevelopmentrepairmaintenancerequirethesupportofth

##  Transformers pipeline (and zero-shot):

In [None]:
import transformers
import torch

model_id = "meta-llama/Meta-Llama-3-8B-Instruct"

# Text-generation pipeline; weights are loaded in bfloat16 and placed
# automatically on the available device(s).
pipeline = transformers.pipeline(
    "text-generation",
    model=model_id,
    model_kwargs={"torch_dtype": torch.bfloat16},
    device_map="auto",
)

# Zero-shot multiple-choice example: a system instruction plus one user question.
messages = [
    {"role": "system", "content": "You're a helpful assistant and you are asked to answer a question correctly, given a certain number of options. Answer with the correct option only and then stop."},
    {"role": "user", "content": "Given this question: Who is Taylor Swift? \n you must answer by choosing only one option above these: A. a snowboard; B. a cat; C. a singer. The correct answer is:"},
]

# Render the chat messages to a single prompt string (not token ids) and
# append the header that cues the assistant's turn.
prompt = pipeline.tokenizer.apply_chat_template(
        messages,
        tokenize=False, 
        add_generation_prompt=True
)

# Stop on either the tokenizer's EOS token or the "<|eot_id|>" token.
terminators = [
    pipeline.tokenizer.eos_token_id,
    pipeline.tokenizer.convert_tokens_to_ids("<|eot_id|>")
]

# Sampling is enabled below, so fix the seed to make the printed answer
# repeatable when the cell is re-run on the same setup.
torch.manual_seed(42)

outputs = pipeline(
    prompt,
    max_new_tokens=256,
    eos_token_id=terminators,
    # Set the padding token explicitly instead of relying on the implicit
    # fallback to EOS during generation.
    pad_token_id=pipeline.tokenizer.eos_token_id,
    do_sample=True,
    temperature=0.6,
    top_p=0.9,
)
# The generated text starts with the prompt; print only the continuation.
print(outputs[0]["generated_text"][len(prompt):])


##  Transformers AutoModelForCausalLM  (and zero-shot)

In [None]:
from transformers import AutoTokenizer, AutoModelForCausalLM
import torch

model_id = "meta-llama/Meta-Llama-3-8B-Instruct"

# Load tokenizer and model; weights are loaded in bfloat16 and placed
# automatically on the available device(s).
tokenizer = AutoTokenizer.from_pretrained(model_id)
model = AutoModelForCausalLM.from_pretrained(
    model_id,
    torch_dtype=torch.bfloat16,
    device_map="auto",
)

# Zero-shot multiple-choice example: a system instruction plus one user question.
messages = [
    {"role": "system", "content": "You're a helpful assistant and you are asked to answer a question correctly, given a certain number of options. Answer with the correct option only and then stop."},
    {"role": "user", "content": "Given this question: Who is Taylor Swift? \n you must answer by choosing only one option above these: A. a snowboard; B. a cat; C. a singer. The correct answer is:"},
]

# Tokenize the chat into a tensor of input ids, ending with the header that
# cues the assistant's turn, and move it to the model's device.
input_ids = tokenizer.apply_chat_template(
    messages,
    add_generation_prompt=True,
    return_tensors="pt"
).to(model.device)

# Stop on either the tokenizer's EOS token or the "<|eot_id|>" token.
terminators = [
    tokenizer.eos_token_id,
    tokenizer.convert_tokens_to_ids("<|eot_id|>")
]

# Sampling is enabled below, so fix the seed to make the printed answer
# repeatable when the cell is re-run on the same setup.
torch.manual_seed(42)

outputs = model.generate(
    input_ids,
    # Single, unpadded prompt: every position is a real token, so the mask is
    # all ones. Passing it (and pad_token_id) explicitly avoids relying on
    # generate() inferring them.
    attention_mask=torch.ones_like(input_ids),
    pad_token_id=tokenizer.eos_token_id,
    max_new_tokens=256,
    eos_token_id=terminators,
    do_sample=True,
    temperature=0.6,
    top_p=0.9,
)
# generate() returns prompt + continuation; keep only the newly generated ids.
response = outputs[0][input_ids.shape[-1]:]
print(tokenizer.decode(response, skip_special_tokens=True))