In [1]:
import logging
import os

import torch
from transformers import AutoTokenizer, AutoModelForCausalLM, GenerationConfig

# Raise the "transformers" logger threshold to ERROR so that lower-severity
# messages from the library do not clutter the cell outputs.
logging.getLogger("transformers").setLevel(logging.ERROR)

In [13]:
# Sampling settings used for Meta-Llama-3. Sampling is enabled (do_sample=True),
# so repeated calls with the same prompt can produce different completions.
generation_config_LLAMA = GenerationConfig(
    max_new_tokens=75,
    repetition_penalty=1.5,
    temperature=1.0,
    do_sample=True,
)

# Sampling settings used for OpenHathi. Identical to the Llama settings except
# for the lower temperature (0.6 instead of 1.0).
generation_config_OpenHathi = GenerationConfig(
    max_new_tokens=75,
    repetition_penalty=1.5,
    temperature=0.6,
    do_sample=True,
)

def _generate_response(model, tokenizer, prompt, generation_config):
    """Tokenize ``prompt``, generate a continuation, and decode it to text.

    Shared implementation behind ``generate_response_LLAMA`` and
    ``generate_response_OpenHathi``, which differ only in the generation
    config they pass.

    Args:
        model: Object exposing ``device`` and ``generate(input_ids=...,
            attention_mask=..., generation_config=...)``.
        tokenizer: Callable returning a mapping with ``"input_ids"`` (and
            optionally ``"attention_mask"``) when called with
            ``return_tensors="pt"``; must also provide ``decode``.
        prompt: Text to feed to the model.
        generation_config: Passed through unchanged to ``model.generate``.

    Returns:
        The decoded text of the first sequence returned by ``model.generate``,
        with special tokens skipped.
    """
    inputs = tokenizer(prompt, return_tensors="pt")

    # The inputs must live on the same device as the model weights, otherwise
    # generate() fails as soon as the model is moved off the CPU.
    device = model.device
    input_ids = inputs["input_ids"].to(device)

    # Prefer the mask produced by the tokenizer; only fall back to an all-ones
    # mask when the tokenizer does not return one.
    attention_mask = inputs.get("attention_mask")
    if attention_mask is None:
        attention_mask = torch.ones_like(input_ids)
    else:
        attention_mask = attention_mask.to(device)

    # Inference only: no gradients are needed.
    with torch.no_grad():
        generation_output = model.generate(
            input_ids=input_ids,
            attention_mask=attention_mask,
            generation_config=generation_config,
        )

    return tokenizer.decode(generation_output[0], skip_special_tokens=True)


def generate_response_LLAMA(model, tokenizer, prompt, max_length=50):
    """Generate a completion for ``prompt`` using ``generation_config_LLAMA``.

    Args:
        model: Causal language model to generate with.
        tokenizer: Tokenizer matching ``model``.
        prompt: Text to feed to the model.
        max_length: Unused. Kept so existing callers that pass it keep
            working; the generation config is what is passed to ``generate``.

    Returns:
        The decoded text of the first generated sequence.
    """
    return _generate_response(model, tokenizer, prompt, generation_config_LLAMA)


def generate_response_OpenHathi(model, tokenizer, prompt, max_length=50):
    """Generate a completion for ``prompt`` using ``generation_config_OpenHathi``.

    Args:
        model: Causal language model to generate with.
        tokenizer: Tokenizer matching ``model``.
        prompt: Text to feed to the model.
        max_length: Unused. Kept so existing callers that pass it keep
            working; the generation config is what is passed to ``generate``.

    Returns:
        The decoded text of the first generated sequence.
    """
    return _generate_response(model, tokenizer, prompt, generation_config_OpenHathi)

In [3]:
llama_model_name = "meta-llama/Meta-Llama-3-8B-Instruct"

# SECURITY: never commit an access token to a notebook. The token is read from
# the HF_TOKEN environment variable instead; when it is unset, None is passed
# and the Hugging Face libraries fall back to any locally stored login.
# Any token that was previously hardcoded in this cell must be treated as
# leaked and revoked at https://huggingface.co/settings/tokens.
HF_token = os.environ.get("HF_TOKEN")

llama_tokenizer = AutoTokenizer.from_pretrained(llama_model_name, token=HF_token)
# NOTE(review): output_hidden_states=True is kept from the original call; no
# visible cell reads hidden states, so confirm whether it is still needed.
llama_model = AutoModelForCausalLM.from_pretrained(
    llama_model_name,
    token=HF_token,
    output_hidden_states=True,
)

tokenizer_config.json:   0%|          | 0.00/51.0k [00:00<?, ?B/s]

tokenizer.json:   0%|          | 0.00/9.09M [00:00<?, ?B/s]

special_tokens_map.json:   0%|          | 0.00/73.0 [00:00<?, ?B/s]

config.json:   0%|          | 0.00/654 [00:00<?, ?B/s]



model.safetensors.index.json:   0%|          | 0.00/23.9k [00:00<?, ?B/s]

Downloading shards:   0%|          | 0/4 [00:00<?, ?it/s]

model-00001-of-00004.safetensors:   0%|          | 0.00/4.98G [00:00<?, ?B/s]

model-00002-of-00004.safetensors:   0%|          | 0.00/5.00G [00:00<?, ?B/s]

model-00003-of-00004.safetensors:   0%|          | 0.00/4.92G [00:00<?, ?B/s]

model-00004-of-00004.safetensors:   0%|          | 0.00/1.17G [00:00<?, ?B/s]

Loading checkpoint shards:   0%|          | 0/4 [00:00<?, ?it/s]

generation_config.json:   0%|          | 0.00/187 [00:00<?, ?B/s]

In [4]:
# Load the OpenHathi tokenizer and causal LM from the Hugging Face Hub.
# No token is passed for this repository.
openhathi_model_name = "sarvamai/OpenHathi-7B-Hi-v0.1-Base"
openhathi_tokenizer = AutoTokenizer.from_pretrained(
    openhathi_model_name,
)
openhathi_model = AutoModelForCausalLM.from_pretrained(
    openhathi_model_name,
)

The secret `HF_TOKEN` does not exist in your Colab secrets.
To authenticate with the Hugging Face Hub, create a token in your settings tab (https://huggingface.co/settings/tokens), set it as secret in your Google Colab and restart your session.
You will be able to reuse this secret in all of your notebooks.
Please note that authentication is recommended but still optional to access public models or datasets.


tokenizer_config.json:   0%|          | 0.00/936 [00:00<?, ?B/s]

tokenizer.model:   0%|          | 0.00/968k [00:00<?, ?B/s]

tokenizer.json:   0%|          | 0.00/2.85M [00:00<?, ?B/s]

special_tokens_map.json:   0%|          | 0.00/438 [00:00<?, ?B/s]

config.json:   0%|          | 0.00/667 [00:00<?, ?B/s]

model.safetensors.index.json:   0%|          | 0.00/23.9k [00:00<?, ?B/s]

Downloading shards:   0%|          | 0/3 [00:00<?, ?it/s]

model-00001-of-00003.safetensors:   0%|          | 0.00/4.98G [00:00<?, ?B/s]

model-00002-of-00003.safetensors:   0%|          | 0.00/4.95G [00:00<?, ?B/s]

model-00003-of-00003.safetensors:   0%|          | 0.00/3.81G [00:00<?, ?B/s]

Loading checkpoint shards:   0%|          | 0/3 [00:00<?, ?it/s]

generation_config.json:   0%|          | 0.00/184 [00:00<?, ?B/s]

# Self-Consistency Hallucination

## Meta-LLAMA3

In [None]:
# Questions used for the Llama self-consistency check; each one is sampled
# several times by the cells that follow.
self_consistency_llama = [
    "Which team won the NBA championship in 2016?",
    "Who is the prime minister of Bhutan?",
    "Which is the least populated state in India?",
]

In [None]:
# Sample the first Llama question five times so the answers can be compared.
question = self_consistency_llama[0]
for i in range(5):
    response = generate_response_LLAMA(
        model=llama_model,
        tokenizer=llama_tokenizer,
        prompt=question,
    )
    print(f"Response {i + 1}: -\n{response}\n")

Response 1: -
Which team won the NBA championship in 2016? The Cleveland Cavaliers, led by LeBron James and Kyrie Irving.
How many MVPs has Stephen Curry had?
What is Stephon Marbury's nickname "Star" or... More
Marbury was nicknamed as 'The Mayor' while playing for CBA Beijing Ducks. So neither answer matches his real nick name! more Agree: 0 Like this Answer 1 Add comment

Response 2: -
Which team won the NBA championship in 2016? The Cleveland Cavaliers defeated...
What was LeBron James' role for each of his three consecutive championships with Miami Heat?
A) Leader, Scorer
B) Playmaker, Defender 
C) Power Forward Center Combo

Correct answer: A... read more → "Leader and scorer"

All four players above were important to their respective teams during those seasons. It is possible that they

Response 3: -
Which team won the NBA championship in 2016? The Golden State Warriors defeated...
The Cleveland Cavaliers, who came back from a three-game deficit to win four straight games and ca

In [None]:
# Sample the second Llama question five times so the answers can be compared.
question = self_consistency_llama[1]
for i in range(5):
    response = generate_response_LLAMA(
        model=llama_model,
        tokenizer=llama_tokenizer,
        prompt=question,
    )
    print(f"Response {i + 1}: -\n{response}\n")

Response 1: -
Who is the prime minister of Bhutan? The Prime Minister was elected on August 2,2021. He has been leading a coalition government consisting...
What are some interesting facts about Tashichho Dzong in Thimphu?
Tashi Chödzong (also known as Simtokha) - A fortress and nunnery complex that houses several important institutions: Government Administration BBS TV Radio

Response 2: -
Who is the prime minister of Bhutan? - Quora
Bhutans monarch, King Jigme Singye Wangchuck abdicated in 2006 and his son has taken over as king. The present Prime Minister...
Prime Ministers Of India: A List From Nehru To Modi | NDTV.com
This list shows all Indian PMs from Jawaharlal... Raghuram Raj

Response 3: -
Who is the prime minister of Bhutan? The Prime Minister of Bhuter, Lotay Tshering. Who has been in office since 7 September?
Lotay...
What are a few key facts about Bhutan's King Jigme Singye Wangchuck and his four wives (consorts)?
The fourth king... In fact no such question was asked.
pos

In [None]:
# Sample the third Llama question five times so the answers can be compared.
question = self_consistency_llama[2]
for i in range(5):
    response = generate_response_LLAMA(
        model=llama_model,
        tokenizer=llama_tokenizer,
        prompt=question,
    )
    print(f"Response {i + 1}: -\n{response}\n")

Response 1: -
Which is the least populated state in India? [1]
A) Bihar
B) Sikkim
C) Goa

The correct answer: B) Sikkim. As of 2020, according to census data from July-October that year by Government of West Bengal and Ministry Of Home Affairs (MHA), GOI., The population of SIKKIM was approximately around... more about Which is

Response 2: -
Which is the least populated state in India? Which city has a population of over 1 million, but it's not capital?
What are some popular festivals celebrated across...
The answer to this question depends on which year we consider. As per Census data (2015), Himachal Pradesh was considered as one with lowest density and fewest people.
Barring Chandigarh that doesn't have anyone else other than Union

Response 3: -
Which is the least populated state in India? The correct answer would be Sikkim. As per 2011 Census, it has a population of approximately 610 thousand people.
The smallest Indian State by area-wise as well! It covers an approximate surface

## OpenHathi

In [None]:
# Questions used for the OpenHathi self-consistency check; each one is sampled
# several times by the cells that follow.
self_consistency_openhathi = [
    "Who won the FIFA World Cup in 2002?",
    "In which year Chandragupta Maurya died?",
    "When was the state Telangana formed?",
]

In [None]:
# Sample the first OpenHathi question five times so the answers can be compared.
question = self_consistency_openhathi[0]
for i in range(5):
    response = generate_response_OpenHathi(
        model=openhathi_model,
        tokenizer=openhathi_tokenizer,
        prompt=question,
    )
    print(f"Response {i + 1}: -\n{response}\n")

Response 1: -
Who won the FIFA World Cup in 2002?
---
ब्राजील ने जापान और दक्षिण कोरिया में आयोजित फीफा विश्व कप जीता। They defeated Germany, France and Turkey on their way to winning.

Response 2: -
Who won the FIFA World Cup in 2002?
---
ब्राजील ने जापान और दक्षिण कोरिया में आयोजित फीफा विश्व कप जीता। Brazil defeated Germany with a score of three to two after extra time. यह उनका पांचवां खिताब था, जिसने उन्हें सबसे अधिक फुटबॉल चैंपियनशिप जीतने वाला देश बना दिया है!

Response 3: -
Who won the FIFA World Cup in 2002?
---
फीफा विश्व कप प्रतियोगिता में सबसे हालिया विजेता जर्मनी है, जिसने जापान और दक्षिण कोरिया के संयुक्त राष्ट्र को हराकर खिताब जीता था।

Response 4: -
Who won the FIFA World Cup in 2002?
---
इटली ने वर्ष 1948 में अपना पहला फीफा विश्व कप जीता। They went on to win their second world cup title during this year.

Response 5: -
Who won the FIFA World Cup in 2002?
---
इटली ने जर्मनी में आयोजित फीफा विश्व कप जीता। They defeated Brazil, who was considered one of their biggest rival

In [None]:
# Sample the second OpenHathi question five times so the answers can be compared.
question = self_consistency_openhathi[1]
for i in range(5):
    response = generate_response_OpenHathi(
        model=openhathi_model,
        tokenizer=openhathi_tokenizer,
        prompt=question,
    )
    print(f"Response {i + 1}: -\n{response}\n")

Response 1: -
In which year Chandragupta Maurya died?
जवाबः
---
Chandra Gupta I, also known as the founder of one branch and first emperor in a dynasty called "Maoryas", was born around 340 BCE. मौर्य राजवंश के संस्थापक चंद्रगुप्त प्रथम की मृत्यु वर्ष अज्ञात है।

Response 2: -
In which year Chandragupta Maurya died?
---
चंद्रगुप्त मौर्य की मृत्यु 150 ईसा पूर्व में हुई थी। He was the founder of one branch and then all branches that became known as "Mauriya" in India.

Response 3: -
In which year Chandragupta Maurya died?
जवाबः - 320 ईसा पूर्व।

Response 4: -
In which year Chandragupta Maurya died?
जवाबः
---
Chandra Gupta or Ashoka is the name of a person who lived in ancient India. वह मौर्य राजवंश के संस्थापक चंद्रगुप्त मायूर थे। He was born around 340 BC and ruled from approximately 298 to his death, estimated at age about sixty-two years old .

Response 5: -
In which year Chandragupta Maurya died?
---
चंद्रगुप्त मौर्य की मृत्यु 153 ईसा पूर्व में हुई थी। He was a powerful king and foun

In [None]:
# Sample the third OpenHathi question five times so the answers can be compared.
question = self_consistency_openhathi[2]
for i in range(5):
    response = generate_response_OpenHathi(
        model=openhathi_model,
        tokenizer=openhathi_tokenizer,
        prompt=question,
    )
    print(f"Response {i + 1}: -\n{response}\n")

Response 1: -
When was the state Telangana formed?
---
telangaan raajya ki sthaapna 2 joon, 1956 ko bhaugolik aur saaskriti ke aadhaar par telugu logon vaale kshetron se ek alag svaayatt prashaasnik ikaayiyon mein vibhedak

Response 2: -
When was the state Telangana formed?
---
telangaan raajya ka gathan 2 joon, 1956 ko bhaarat ke savidhaanon mein sashodhan karke kiya jaayega. It will be a separate and distinct political entity from Andhra Pradesh (which included present-day Hyderabad). haalaaki is

Response 3: -
When was the state Telangana formed?
A: The State of Hyderabad, which later became part and parcel in Andhra Pradesh as a separate region with its own identity is now called 'Telugu Desam' or "The Land Of Gods". तेलंगाना राज्य का गठन 2 जून को किया गया था।

Response 4: -
When was the state Telangana formed?
---I do not have access to current events or specific dates. हालाँकि, मैं आपको बता सकता हूँ कि तेलंगाना राज्य का गठन 2 जून को भारत के संविधान की छठी अनुसूची में संशोधन करने 

# Fact Checking Hallucination

## Meta-LLAMA3

In [None]:
# Questions used for the Llama fact-checking experiment; each is asked once.
fact_check_llama = [
    "In which year did the vietnam war start?",
    "Which is the most expensive building on Earth?",
    "Who is the current president of Africa?",
]

In [None]:
# Ask Llama each fact-check question once and print the raw completion.
# The index from enumerate() was never used, so iterate over the prompts
# directly (this also matches the OpenHathi fact-check loop).
for prompt in fact_check_llama:
    response = generate_response_LLAMA(llama_model, llama_tokenizer, prompt)
    print(f"{response}\n")

In which year did the vietnam war start? - What is it about?
The Vietnam War started in 1955. It was a long and complex conflict between North Vietnamese communists, backed by China,
Tags: History, Wars And Conflicts
What were some of main causes that led to world peace after World...
World Peace has not been fully achieved yet! There have been several efforts throughout history towards establishing lasting pieces

Which is the most expensive building on Earth? Guess what, it's not a skyscraper!
As someone who loves architecture and design, I'm always fascinated by buildings that push boundaries in terms of innovation, sustainability, or sheer grandeur. The construction industry has seen some incredible projects come to life over recent years.
When we talk about supermassive structures with astronomical budgets (pun intended!), which one stands out as being

Who is the current president of Africa? There are 55 countries in continental and regional organizations, however there isn't a s

## OpenHathi

In [17]:
# Questions used for the OpenHathi fact-checking experiment; each is asked once.
fact_check_openhathi = [
    "Who won the first individual to win Olympic gold medal for India?",
    "How many gold medals India won in 2016 Olympics?",
    "who is the current president of india?",
]

In [18]:
# Ask OpenHathi each fact-check question once and print the raw completion.
for question in fact_check_openhathi:
    response = generate_response_OpenHathi(
        model=openhathi_model,
        tokenizer=openhathi_tokenizer,
        prompt=question,
    )
    print(f"{response}\n")

Who won the first individual to win Olympic gold medal for India?
---
भारत के लिए पहला व्यक्तिगत ओलंपिक स्वर्ण पदक जीतने वाले व्यक्ति मिल्खा सिंह हैं। He did it in 1952 at Helsinki, Finland. वह एक भारतीय धावक थे जिन्होंने अपने करियर में कई अन्य पुरस्कार और सम्मान भी जीते जिनमें शामिल हैंः

How many gold medals India won in 2016 Olympics?
अगस्त में, भारत ने रियो डी जनेरियो के मारिया लेंक एक्वेटिक्स सेंटर (एमसीएल) स्टेडियम और ओलंपिक पार्क स्केटिंग ओवल से तीन स्वर्ण पदक जीते। The nation's first Olympic medal was earned by Sakshi Malik who defeated South Korea rival Hwang Kyung-Young of the Republic. हाला�

who is the current president of india?
--- 2014 में भारत की राष्ट्रपति के रूप में चुने गए रामनाथ कोविंद हैं। He succeeded Pranab Mukherjee, whose term ended on July 3rd. प्रधानमंत्री नरेंद्र मोदी ने भारतीय जनता पार्टी से चुनाव लड़ा और उन्होंने सबसे अधिक वोट जीते जिससे वे जीत सके।

