In [1]:
from transformers import AutoModelForSeq2SeqLM, AutoTokenizer

  from .autonotebook import tqdm as notebook_tqdm


In [2]:
# Checkpoint identifier passed to both from_pretrained() calls below.
MODEL_NAME = "CohereForAI/aya-101"

In [4]:
# Load the tokenizer and the seq2seq model for MODEL_NAME. The progress bar
# below shows 11 checkpoint shards taking over a minute, so this cell is slow.
tokenizer = AutoTokenizer.from_pretrained(MODEL_NAME)
aya_model = AutoModelForSeq2SeqLM.from_pretrained(MODEL_NAME)

Loading checkpoint shards: 100%|██████████| 11/11 [01:18<00:00,  7.11s/it]


In [5]:
# Smoke test: ask for a Turkish -> English translation, capped at 128 new tokens.
tur_inputs = tokenizer.encode("Translate to English: Aya cok dilli bir dil modelidir.", return_tensors="pt")
tur_outputs = aya_model.generate(tur_inputs, max_new_tokens=128)
# decode() is called without skip_special_tokens, so <pad> and </s> appear in the printed text.
print(tokenizer.decode(tur_outputs[0]))

<pad> Aya is a multi-lingual language model.</s>


In [6]:
# First attempt: one long prompt asking for similar-sounding options with both
# Korean script and phonetics. The prompt text is kept verbatim (typos included)
# because it is the exact model input.
inputs = tokenizer.encode("How do I say 'eat atleast a little something' in Korean that sounds like 'boradu chom bogo'? But i am not good at the phonetic version so please think about possibilites of sounds that are similar and give some options with both the korean scriot and the correct phonetic so that I can read and verify it. Thank you.", return_tensors="pt")

In [7]:
# No max_new_tokens is passed here, so the library's default generation length
# limit applies; the decoded result shown further down is cut off mid-sentence.
outputs = aya_model.generate(inputs)



In [10]:
# Decode the first generated sequence; special tokens such as <pad> are kept.
tokenizer.decode(outputs[0])

'<pad> Here are some possible Korean spellings and phonetic variations for the phrase "'

In [17]:
# Shorter variant of the earlier prompt: it drops the request for Korean script
# and verified phonetics. This overwrites the previous `inputs`.
inputs = tokenizer.encode("How do I say 'eat atleast a little something' in Korean that sounds like 'boradu chom bogo'? But i am not good at the phonetic version so please think about possibilites of sounds that are similar. Thank you.", return_tensors="pt")

In [12]:
# Allow up to 200 new tokens; the printed result below still ends mid-sentence.
# NOTE(review): this cell's execution count (12) is older than the prompt cell
# above it (17), so outputs1 may have been generated from an earlier `inputs`.
# Restart the kernel and run all cells to confirm the output matches the prompt.
outputs1 = aya_model.generate(inputs, max_new_tokens=200)

In [15]:
# Print one sentence per line by splitting on ". ". This also separates numbered
# list markers ("1. ", "2. ") from their items, as visible in the output.
print("\n".join(tokenizer.decode(outputs1[0]).split(". ")))

<pad> 'boradu chom bogo' is a Korean phrase that means 'at least eat something'
The phrase is often used to express a desire to eat something, and it can be used to express a desire to eat something that is a little bit of something
Here are some possible phonetic variations of the phrase: 1
'boradu chom bogo' - 'bora-du' is a Korean phrase that means 'at least eat something'
The phrase is often used to express a desire to eat something that is a little bit of something, and it can be used to express a desire to eat something that is a little bit of something
2
'boradu chom bogo' - 'bora-du' is a Korean phrase that means 'at least eat


In [18]:
def helpMe(query, max_new_tokens=200, skip_special_tokens=False):
	"""Send a prompt to the Aya model and return its reply, one sentence per line.

	Relies on the notebook-level ``tokenizer`` and ``aya_model`` objects.

	Args:
		query: Prompt text to encode and pass to the model.
		max_new_tokens: Upper bound on the number of generated tokens. The
			default of 200 matches the previously hard-coded value; raise it
			when a reply is cut off mid-sentence.
		skip_special_tokens: When True, markers such as ``<pad>`` and ``</s>``
			are removed from the decoded text. Defaults to False so existing
			calls keep returning exactly what they did before.

	Returns:
		The decoded first generated sequence with every ``". "`` replaced by a
		newline. Note that this split also separates numbered list markers
		such as ``"1. "`` from the text that follows them.
	"""
	inputs = tokenizer.encode(query, return_tensors="pt")
	outputs = aya_model.generate(inputs, max_new_tokens=max_new_tokens)
	decoded = tokenizer.decode(outputs[0], skip_special_tokens=skip_special_tokens)
	return "\n".join(decoded.split(". "))

In [20]:
# Ask explicitly for both the Korean script and a phonetic version.
print(helpMe("How do I say 'eat atleast a little something' in Korean that sounds like 'boradu chom bogo'? Please give the korean script and the phonetic version. Thank you."))

<pad> Korean script: 보라도 좀 먹고 Phonetic version: borado chomeom boggo</s>


### Mistake
Prompt: How do I say 'eat atleast a little something' in Korean that sounds like 'boradu chom bogo'? Please give the korean script and the phonetic version. Thank you.

Output: <pad> Korean script: 보라도 좀 먹고 Phonetic version: borado chomeom boggo</s>

Expected Output: Korean script: 뭐라도 좀 먹고 Phonetic version: mwolado jom meoggo

Mistakes: 
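- It seems to have assumed that 'bora' is a real word, rather than recognizing it as a mistake in my romanization (the expected word is 뭐라도).
- It did not correct the mistakes in the transliteration I gave ('boradu chom bogo').
- It even introduced a new error in its own transliteration: 'chom' from the prompt became 'chomeom'.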

In [21]:
# Variant prompt: state that the transliteration may be wrong and ask the model to correct it.
print(helpMe("How do I say 'eat atleast a little something' in Korean that sounds like 'boradu chom bogo'? But i am not good at the transliteration so please correct that too. Thank you."))

<pad> 'boradu chom bogo' is written as '보라도 좀 먹어'.</s>
