In [1]:
import kagglehub
from tqdm import tqdm
from pathlib import Path
import pandas as pd
from transformers import pipeline
from datasets import Dataset, load_dataset
from transformers import set_seed
set_seed(42)

# Load the original sentiment analysis dataset

In [2]:
# Download latest version
path = kagglehub.dataset_download("kashishparmar02/social-media-sentiments-analysis-dataset")

print("Path to dataset files:", path)

Downloading from https://www.kaggle.com/api/v1/datasets/download/kashishparmar02/social-media-sentiments-analysis-dataset?dataset_version_number=3...


100%|‚ñà‚ñà‚ñà‚ñà‚ñà‚ñà‚ñà‚ñà‚ñà‚ñà| 50.9k/50.9k [00:00<00:00, 12.8MB/s]

Extracting files...
Path to dataset files: /root/.cache/kagglehub/datasets/kashishparmar02/social-media-sentiments-analysis-dataset/versions/3





In [3]:
df = pd.read_csv(Path(path) / "sentimentdataset.csv")
df.head()

Unnamed: 0.2,Unnamed: 0.1,Unnamed: 0,Text,Sentiment,Timestamp,User,Platform,Hashtags,Retweets,Likes,Country,Year,Month,Day,Hour
0,0,0,Enjoying a beautiful day at the park! ...,Positive,2023-01-15 12:30:00,User123,Twitter,#Nature #Park,15.0,30.0,USA,2023,1,15,12
1,1,1,Traffic was terrible this morning. ...,Negative,2023-01-15 08:45:00,CommuterX,Twitter,#Traffic #Morning,5.0,10.0,Canada,2023,1,15,8
2,2,2,Just finished an amazing workout! üí™ ...,Positive,2023-01-15 15:45:00,FitnessFan,Instagram,#Fitness #Workout,20.0,40.0,USA,2023,1,15,15
3,3,3,Excited about the upcoming weekend getaway! ...,Positive,2023-01-15 18:20:00,AdventureX,Facebook,#Travel #Adventure,8.0,15.0,UK,2023,1,15,18
4,4,4,Trying out a new recipe for dinner tonight. ...,Neutral,2023-01-15 19:55:00,ChefCook,Instagram,#Cooking #Food,12.0,25.0,Australia,2023,1,15,19


In [4]:
df = df.drop(columns=["Unnamed: 0", "Unnamed: 0.1"])
df.head()

Unnamed: 0,Text,Sentiment,Timestamp,User,Platform,Hashtags,Retweets,Likes,Country,Year,Month,Day,Hour
0,Enjoying a beautiful day at the park! ...,Positive,2023-01-15 12:30:00,User123,Twitter,#Nature #Park,15.0,30.0,USA,2023,1,15,12
1,Traffic was terrible this morning. ...,Negative,2023-01-15 08:45:00,CommuterX,Twitter,#Traffic #Morning,5.0,10.0,Canada,2023,1,15,8
2,Just finished an amazing workout! üí™ ...,Positive,2023-01-15 15:45:00,FitnessFan,Instagram,#Fitness #Workout,20.0,40.0,USA,2023,1,15,15
3,Excited about the upcoming weekend getaway! ...,Positive,2023-01-15 18:20:00,AdventureX,Facebook,#Travel #Adventure,8.0,15.0,UK,2023,1,15,18
4,Trying out a new recipe for dinner tonight. ...,Neutral,2023-01-15 19:55:00,ChefCook,Instagram,#Cooking #Food,12.0,25.0,Australia,2023,1,15,19


# Load the translated dataframe with Gemini-2.5 Pro

In [26]:
gemini_df = pd.read_csv("/notebooks/translations-gemini-2.5pro.csv")
gemini_df["English"] = gemini_df.apply(lambda x: x["English"].strip(), axis=1)

In [27]:
gemini_df

Unnamed: 0,English,Myanmar
0,Enjoying a beautiful day at the park!,·Äï·Äî·Ä∫·Ä∏·ÄÅ·Äº·Ä∂·Äë·Ä≤·Äô·Äæ·Ä¨ ·Äú·Äæ·Äï·Äê·Ä≤·Ä∑·Äî·Ä±·Ä∑·Äú·Ä±·Ä∏·Äê·ÄÖ·Ä∫·Äî·Ä±·Ä∑·ÄÄ·Ä≠·ÄØ ·Äï·Äª·Ä±·Ä¨·Ä∫·Äõ·ÄΩ·Äæ·ÄÑ·Ä∫·ÄÖ...
1,Traffic was terrible this morning.,·Äí·ÄÆ·Äô·Äî·ÄÄ·Ä∫ ·Äú·Äô·Ä∫·Ä∏·Ä°·Äõ·Äô·Ä∫·Ä∏·Äï·Ä≠·Äê·Ä∫·Äê·Äö·Ä∫·Åã
2,Just finished an amazing workout! üí™,·Ä°·Äõ·Äô·Ä∫·Ä∏·ÄÄ·Ä±·Ä¨·ÄÑ·Ä∫·Ä∏·Äê·Ä≤·Ä∑ ·Äú·Ä±·Ä∑·ÄÄ·Äª·ÄÑ·Ä∑·Ä∫·ÄÅ·Äî·Ä∫·Ä∏·Äê·ÄÖ·Ä∫·ÄÅ·ÄØ ·ÄÅ·ÄØ·Äï·Ä≤·Äï·Äº·ÄÆ·Ä∏·Äû·ÄΩ·Ä¨·Ä∏·Äï...
3,Excited about the upcoming weekend getaway!,·Äú·Ä¨·Äô·Äö·Ä∑·Ä∫ ·ÄÖ·Äî·Ä±·Åä ·Äê·Äî·ÄÑ·Ä∫·Äπ·ÄÇ·Äî·ÄΩ·Ä± ·Ä°·Äï·Äî·Ä∫·Ä∏·Äñ·Äº·Ä±·ÄÅ·Äõ·ÄÆ·Ä∏·Ä°·Äê·ÄΩ·ÄÄ·Ä∫ ·ÄÖ·Ä≠·Äê·Ä∫·Äú·Äæ...
4,Trying out a new recipe for dinner tonight.,·Äí·ÄÆ·Ää ·Ää·ÄÖ·Ä¨·Ä°·Äê·ÄΩ·ÄÄ·Ä∫ ·Äü·ÄÑ·Ä∫·Ä∏·ÄÅ·Äª·ÄÄ·Ä∫·Äî·Ää·Ä∫·Ä∏·Ä°·Äû·ÄÖ·Ä∫·Äê·ÄÖ·Ä∫·ÄÅ·ÄØ ·ÄÖ·Äô·Ä∫·Ä∏·Äû·Äï·Ä∫·ÄÅ·Äª·ÄÄ·Ä∫...
...,...,...
727,Collaborating on a science project that receiv...,·Äí·Ä±·Äû·ÄÜ·Ä≠·ÄØ·ÄÑ·Ä∫·Äõ·Ä¨ ·Äï·Äº·Äï·ÄΩ·Ä≤·Äê·ÄÖ·Ä∫·ÄÅ·ÄØ·Äô·Äæ·Ä¨ ·Ä°·Äû·Ä≠·Ä°·Äô·Äæ·Äê·Ä∫·Äï·Äº·ÄØ·Äô·Äæ·ÄØ ·Äõ·Äõ·Äæ·Ä≠·ÄÅ·Ä≤...
728,Attending a surprise birthday party organized ...,·Äû·Ä∞·ÄÑ·Äö·Ä∫·ÄÅ·Äª·ÄÑ·Ä∫·Ä∏·Äê·ÄΩ·Ä±·ÄÄ ·ÄÖ·ÄÆ·ÄÖ·Äâ·Ä∫·Äï·Ä±·Ä∏·Äê·Ä≤·Ä∑ ·Ä°·Ä∂·Ä∑·Ä°·Ä¨·Ä∏·Äû·ÄÑ·Ä∑·Ä∫·Äñ·ÄΩ·Äö·Ä∫ ·Äô·ÄΩ·Ä±·Ä∏...
729,Successfully fundraising for a school charity ...,·ÄÄ·Äª·Ä±·Ä¨·ÄÑ·Ä∫·Ä∏ ·Äï·Äõ·Äü·Ä≠·Äê ·Ä°·ÄÖ·ÄÆ·Ä°·ÄÖ·Äâ·Ä∫·Äê·ÄÖ·Ä∫·ÄÅ·ÄØ·Ä°·Äê·ÄΩ·ÄÄ·Ä∫ ·Ä°·Ä±·Ä¨·ÄÑ·Ä∫·Äô·Äº·ÄÑ·Ä∫·ÄÖ·ÄΩ·Ä¨ ·Äõ...
730,"Participating in a multicultural festival, cel...",·Äö·Äâ·Ä∫·ÄÄ·Äª·Ä±·Ä∏·Äô·Äæ·ÄØ·Äï·Ä±·Ä´·ÄÑ·Ä∫·Ä∏·ÄÖ·ÄØ·Ä∂ ·Äï·ÄΩ·Ä≤·Äê·Ä±·Ä¨·Ä∫·Äê·ÄÖ·Ä∫·ÄÅ·ÄØ·Äô·Äæ·Ä¨ ·Äï·Ä´·Äù·ÄÑ·Ä∫·Äî·Ä±·Äï·Ä´·Äê...


# Map the translated Myanmar Text into Original DataFrame

In [None]:
def map_eng_mm(row):
    myanmar_text = gemini_df[gemini_df["English"] == row["Text"].strip()]['Myanmar']
    myanmar_text = myanmar_text.drop_duplicates()
    
    return myanmar_text.item()
    
df["Text-MM"] = df.apply(map_eng_mm, axis=1)

In [47]:
df.head()

Unnamed: 0,Text,Sentiment,Timestamp,User,Platform,Hashtags,Retweets,Likes,Country,Year,Month,Day,Hour,Text-MM
0,Enjoying a beautiful day at the park! ...,Positive,2023-01-15 12:30:00,User123,Twitter,#Nature #Park,15.0,30.0,USA,2023,1,15,12,·Äï·Äî·Ä∫·Ä∏·ÄÅ·Äº·Ä∂·Äë·Ä≤·Äô·Äæ·Ä¨ ·Äú·Äæ·Äï·Äê·Ä≤·Ä∑·Äî·Ä±·Ä∑·Äú·Ä±·Ä∏·Äê·ÄÖ·Ä∫·Äî·Ä±·Ä∑·ÄÄ·Ä≠·ÄØ ·Äï·Äª·Ä±·Ä¨·Ä∫·Äõ·ÄΩ·Äæ·ÄÑ·Ä∫·ÄÖ...
1,Traffic was terrible this morning. ...,Negative,2023-01-15 08:45:00,CommuterX,Twitter,#Traffic #Morning,5.0,10.0,Canada,2023,1,15,8,·Äí·ÄÆ·Äô·Äî·ÄÄ·Ä∫ ·Äú·Äô·Ä∫·Ä∏·Ä°·Äõ·Äô·Ä∫·Ä∏·Äï·Ä≠·Äê·Ä∫·Äê·Äö·Ä∫·Åã
2,Just finished an amazing workout! üí™ ...,Positive,2023-01-15 15:45:00,FitnessFan,Instagram,#Fitness #Workout,20.0,40.0,USA,2023,1,15,15,·Ä°·Äõ·Äô·Ä∫·Ä∏·ÄÄ·Ä±·Ä¨·ÄÑ·Ä∫·Ä∏·Äê·Ä≤·Ä∑ ·Äú·Ä±·Ä∑·ÄÄ·Äª·ÄÑ·Ä∑·Ä∫·ÄÅ·Äî·Ä∫·Ä∏·Äê·ÄÖ·Ä∫·ÄÅ·ÄØ ·ÄÅ·ÄØ·Äï·Ä≤·Äï·Äº·ÄÆ·Ä∏·Äû·ÄΩ·Ä¨·Ä∏·Äï...
3,Excited about the upcoming weekend getaway! ...,Positive,2023-01-15 18:20:00,AdventureX,Facebook,#Travel #Adventure,8.0,15.0,UK,2023,1,15,18,·Äú·Ä¨·Äô·Äö·Ä∑·Ä∫ ·ÄÖ·Äî·Ä±·Åä ·Äê·Äî·ÄÑ·Ä∫·Äπ·ÄÇ·Äî·ÄΩ·Ä± ·Ä°·Äï·Äî·Ä∫·Ä∏·Äñ·Äº·Ä±·ÄÅ·Äõ·ÄÆ·Ä∏·Ä°·Äê·ÄΩ·ÄÄ·Ä∫ ·ÄÖ·Ä≠·Äê·Ä∫·Äú·Äæ...
4,Trying out a new recipe for dinner tonight. ...,Neutral,2023-01-15 19:55:00,ChefCook,Instagram,#Cooking #Food,12.0,25.0,Australia,2023,1,15,19,·Äí·ÄÆ·Ää ·Ää·ÄÖ·Ä¨·Ä°·Äê·ÄΩ·ÄÄ·Ä∫ ·Äü·ÄÑ·Ä∫·Ä∏·ÄÅ·Äª·ÄÄ·Ä∫·Äî·Ää·Ä∫·Ä∏·Ä°·Äû·ÄÖ·Ä∫·Äê·ÄÖ·Ä∫·ÄÅ·ÄØ ·ÄÖ·Äô·Ä∫·Ä∏·Äû·Äï·Ä∫·ÄÅ·Äª·ÄÄ·Ä∫...


In [48]:
ordered_columns = ["Text", "Text-MM", "Sentiment", "Timestamp", "User", 
                  "Platform", "Hashtags", "Retweets", "Likes", 
                  "Country", "Year", "Month", "Day", "Hour"]

# Filter to only include columns that actually exist
ordered_columns = [col for col in ordered_columns if col in df.columns]
df = df[ordered_columns]

In [49]:
df.head()

Unnamed: 0,Text,Text-MM,Sentiment,Timestamp,User,Platform,Hashtags,Retweets,Likes,Country,Year,Month,Day,Hour
0,Enjoying a beautiful day at the park! ...,·Äï·Äî·Ä∫·Ä∏·ÄÅ·Äº·Ä∂·Äë·Ä≤·Äô·Äæ·Ä¨ ·Äú·Äæ·Äï·Äê·Ä≤·Ä∑·Äî·Ä±·Ä∑·Äú·Ä±·Ä∏·Äê·ÄÖ·Ä∫·Äî·Ä±·Ä∑·ÄÄ·Ä≠·ÄØ ·Äï·Äª·Ä±·Ä¨·Ä∫·Äõ·ÄΩ·Äæ·ÄÑ·Ä∫·ÄÖ...,Positive,2023-01-15 12:30:00,User123,Twitter,#Nature #Park,15.0,30.0,USA,2023,1,15,12
1,Traffic was terrible this morning. ...,·Äí·ÄÆ·Äô·Äî·ÄÄ·Ä∫ ·Äú·Äô·Ä∫·Ä∏·Ä°·Äõ·Äô·Ä∫·Ä∏·Äï·Ä≠·Äê·Ä∫·Äê·Äö·Ä∫·Åã,Negative,2023-01-15 08:45:00,CommuterX,Twitter,#Traffic #Morning,5.0,10.0,Canada,2023,1,15,8
2,Just finished an amazing workout! üí™ ...,·Ä°·Äõ·Äô·Ä∫·Ä∏·ÄÄ·Ä±·Ä¨·ÄÑ·Ä∫·Ä∏·Äê·Ä≤·Ä∑ ·Äú·Ä±·Ä∑·ÄÄ·Äª·ÄÑ·Ä∑·Ä∫·ÄÅ·Äî·Ä∫·Ä∏·Äê·ÄÖ·Ä∫·ÄÅ·ÄØ ·ÄÅ·ÄØ·Äï·Ä≤·Äï·Äº·ÄÆ·Ä∏·Äû·ÄΩ·Ä¨·Ä∏·Äï...,Positive,2023-01-15 15:45:00,FitnessFan,Instagram,#Fitness #Workout,20.0,40.0,USA,2023,1,15,15
3,Excited about the upcoming weekend getaway! ...,·Äú·Ä¨·Äô·Äö·Ä∑·Ä∫ ·ÄÖ·Äî·Ä±·Åä ·Äê·Äî·ÄÑ·Ä∫·Äπ·ÄÇ·Äî·ÄΩ·Ä± ·Ä°·Äï·Äî·Ä∫·Ä∏·Äñ·Äº·Ä±·ÄÅ·Äõ·ÄÆ·Ä∏·Ä°·Äê·ÄΩ·ÄÄ·Ä∫ ·ÄÖ·Ä≠·Äê·Ä∫·Äú·Äæ...,Positive,2023-01-15 18:20:00,AdventureX,Facebook,#Travel #Adventure,8.0,15.0,UK,2023,1,15,18
4,Trying out a new recipe for dinner tonight. ...,·Äí·ÄÆ·Ää ·Ää·ÄÖ·Ä¨·Ä°·Äê·ÄΩ·ÄÄ·Ä∫ ·Äü·ÄÑ·Ä∫·Ä∏·ÄÅ·Äª·ÄÄ·Ä∫·Äî·Ää·Ä∫·Ä∏·Ä°·Äû·ÄÖ·Ä∫·Äê·ÄÖ·Ä∫·ÄÅ·ÄØ ·ÄÖ·Äô·Ä∫·Ä∏·Äû·Äï·Ä∫·ÄÅ·Äª·ÄÄ·Ä∫...,Neutral,2023-01-15 19:55:00,ChefCook,Instagram,#Cooking #Food,12.0,25.0,Australia,2023,1,15,19


# Upload to HuggingFace

In [51]:
ds = Dataset.from_pandas(df)
ds.push_to_hub("chuuhtetnaing/myanmar-social-media-sentiment-analysis-dataset")

Uploading the dataset shards:   0%|          | 0/1 [00:00<?, ?it/s]

Creating parquet from Arrow format:   0%|          | 0/1 [00:00<?, ?ba/s]

README.md:   0%|          | 0.00/2.37k [00:00<?, ?B/s]

CommitInfo(commit_url='https://huggingface.co/datasets/chuuhtetnaing/myanmar-social-media-sentiment-analysis-dataset/commit/9ffd58b98eab714e9100477d0975278b1b9d19e3', commit_message='Upload dataset', commit_description='', oid='9ffd58b98eab714e9100477d0975278b1b9d19e3', pr_url=None, repo_url=RepoUrl('https://huggingface.co/datasets/chuuhtetnaing/myanmar-social-media-sentiment-analysis-dataset', endpoint='https://huggingface.co', repo_type='dataset', repo_id='chuuhtetnaing/myanmar-social-media-sentiment-analysis-dataset'), pr_revision=None, pr_num=None)

In [64]:
# Create the pipeline
pipe = pipeline("translation", model="facebook/nllb-200-3.3B", device=0)  # device=0 for first GPU

Loading checkpoint shards:   0%|          | 0/3 [00:00<?, ?it/s]

Device set to use cuda:0


In [65]:
pipe("Weekend road trip to explore scenic views.", src_lang="eng_Latn", tgt_lang="mya_Mymr")

[{'translation_text': '·Ä°·Äï·Äî·Ä∫·Ä∏·Äñ·Äº·Ä±·ÄÖ·ÄÅ·Äî·Ä∫·Ä∏·ÄÄ·Ä≠·ÄØ ·Ä°·Äú·Ää·Ä∫·Äû·ÄΩ·Ä¨·Ä∏·Äï·Äº·ÄÆ·Ä∏ ·Äõ·Äæ·ÄØ·ÄÅ·ÄÑ·Ä∫·Ä∏·ÄÄ·Ä≠·ÄØ ·Äú·Ä±·Ä∑·Äú·Ä¨·ÄÄ·Äº·Ää·Ä∫·Ä∑·Äê·Äö·Ä∫·Åã'}]

In [66]:
dataset = Dataset.from_pandas(df)

# Define a function to translate in batches
def translate_batch(examples):
    translations = pipe(
        examples["Text"], 
        src_lang="eng_Latn", 
        tgt_lang="mya_Mymr",
        batch_size=8
    )
    return {
        "Text": examples["Text"],
        "Text_MM": [t["translation_text"] for t in translations],
        "Sentiment": examples["Sentiment"],
        "Timestamp": examples["Timestamp"],
        "User": examples["User"],
        "Platform": examples["Platform"],
        "Hashtags": examples["Hashtags"],
        "Retweets": examples["Retweets"],
        "Likes": examples["Likes"],
        "Country": examples["Country"],
        "Year": examples["Year"],
        "Month": examples["Month"],
        "Day": examples["Day"],
        "Hour": examples["Hour"]
    }

In [7]:
# Apply the translation function to the entire dataset
# This will process in batches automatically
translated_dataset = dataset.map(
    translate_batch,
    batched=True,
    batch_size=8,  # You can adjust this batch size
    remove_columns=dataset.column_names
)



Map:   0%|          | 0/732 [00:00<?, ? examples/s]

You seem to be using the pipelines sequentially on GPU. In order to maximize efficiency please use a dataset


In [None]:
ordered_columns = ["Text", "Text_MM", "Sentiment", "Timestamp", "User", 
                  "Platform", "Hashtags", "Retweets", "Likes", 
                  "Country", "Year", "Month", "Day", "Hour"]

df = translated_dataset.to_pandas()
# Filter to only include columns that actually exist
ordered_columns = [col for col in ordered_columns if col in df.columns]
df = df[ordered_columns]

In [69]:
df.iloc[-10:]

Unnamed: 0,Text,Sentiment,Timestamp,User,Platform,Hashtags,Retweets,Likes,Country,Year,Month,Day,Hour
722,Winning a friendly sports competition against ...,Happy,2023-10-20 14:15:00,SportsVictoryHighSchool,Twitter,#SportsTriumph #HighSchoolAthletics,26.0,50.0,USA,2023,10,20,14
723,Receiving a heartfelt letter from a pen pal in...,Happy,2023-10-21 17:30:00,PenPalConnectionHighSchool,Facebook,#GlobalFriendship #HighSchoolCorrespondence,23.0,45.0,Canada,2023,10,21,17
724,Creating a beautiful mural with fellow art ent...,Happy,2023-10-22 20:45:00,MuralCreationHighSchool,Instagram,#ArtCollaboration #HighSchoolCreativity,22.0,43.0,UK,2023,10,22,20
725,Participating in a school-wide art exhibition....,Happy,2015-11-10 16:45:00,ArtExhibitionJoyHighSchool,Instagram,#ArtisticExpression #HighSchoolCreativity,23.0,44.0,USA,2015,11,10,16
726,Achieving a personal best in a track and field...,Happy,2016-09-14 12:30:00,TrackFieldSuccessHighSchool,Twitter,#AthleticAchievement #HighSchoolSports,26.0,51.0,Canada,2016,9,14,12
727,Collaborating on a science project that receiv...,Happy,2017-08-18 18:20:00,ScienceProjectSuccessHighSchool,Facebook,#ScienceFairWinner #HighSchoolScience,20.0,39.0,UK,2017,8,18,18
728,Attending a surprise birthday party organized ...,Happy,2018-06-22 14:15:00,BirthdayPartyJoyHighSchool,Instagram,#SurpriseCelebration #HighSchoolFriendship,25.0,48.0,USA,2018,6,22,14
729,Successfully fundraising for a school charity ...,Happy,2019-04-05 17:30:00,CharityFundraisingTriumphHighSchool,Twitter,#CommunityGiving #HighSchoolPhilanthropy,22.0,42.0,Canada,2019,4,5,17
730,"Participating in a multicultural festival, cel...",Happy,2020-02-29 20:45:00,MulticulturalFestivalJoyHighSchool,Facebook,#CulturalCelebration #HighSchoolUnity,21.0,43.0,UK,2020,2,29,20
731,Organizing a virtual talent show during challe...,Happy,2020-11-15 15:15:00,VirtualTalentShowSuccessHighSchool,Instagram,#VirtualEntertainment #HighSchoolPositivity,24.0,47.0,USA,2020,11,15,15


In [74]:
dataset = Dataset.from_pandas(df.iloc[-10:])

# Define a function to translate in batches
def translate(example):
    translation = pipe(
        example["Text"], 
        src_lang="eng_Latn", 
        tgt_lang="mya_Mymr"
    )[0]["translation_text"]
    
    print(example["Text"])
    print(translation)
    print()
    return {"Text_MM": translation}

In [83]:
from transformers import AutoTokenizer, AutoModelForSeq2SeqLM

tokenizer = AutoTokenizer.from_pretrained("facebook/nllb-200-3.3B")
model = AutoModelForSeq2SeqLM.from_pretrained("facebook/nllb-200-3.3B")

Loading checkpoint shards:   0%|          | 0/3 [00:00<?, ?it/s]

In [93]:
def translate(text, src_lang="eng_Latn", tgt_lang="mya_Mymr"):
    # Set the language tokens
    tokenizer.src_lang = src_lang
    
    # Tokenize the input text
    inputs = tokenizer(text, return_tensors="pt").to("cuda")
    
    # Get the target language token ID
    forced_bos_token_id = tokenizer.lang_code_to_id[tgt_lang]
    
    # Generate translation
    outputs = model.generate(
        **inputs,
        forced_bos_token_id=forced_bos_token_id,
        max_length=128
    )
    
    # Decode the output tokens
    translation = tokenizer.batch_decode(outputs, skip_special_tokens=True)
    
    return translation

In [None]:
translate("An amusing incident brightened up my day!")

AttributeError: NllbTokenizerFast has no attribute lang_code_to_id

In [112]:
article = "Receiving a heartfelt letter from a pen pal in another country. Connecting across the globe!".split(".")
article

['Receiving a heartfelt letter from a pen pal in another country',
 ' Connecting across the globe!']

In [113]:
article = "Receiving a heartfelt letter from a pen pal in another country. Connecting across the globe!".split(".")
inputs = tokenizer(article, return_tensors="pt")

translated_tokens = model.generate(
    **inputs, forced_bos_token_id=tokenizer.convert_tokens_to_ids("mya_Mymr"), max_length=500
)
tokenizer.batch_decode(translated_tokens, skip_special_tokens=True)[0]

ValueError: Unable to create tensor, you should probably activate truncation and/or padding with 'padding=True' 'truncation=True' to have batched tensors with the same length. Perhaps your features (`input_ids` in this case) have excessive nesting (inputs type `list` where type `int` is expected).

In [104]:
tokenizer.decode(outputs[0], skip_special_tokens=True)

'Smutn√° ud√°lost mi dnes usm√°la den.'

In [114]:
pipe("Receiving a heartfelt letter from a pen pal in another country. Connecting across the globe!".split("."), src_lang="eng_Latn", tgt_lang="mya_Mymr")

[{'translation_text': '·Ä°·ÄÅ·Äº·Ä¨·Ä∏·Äî·Ä≠·ÄØ·ÄÑ·Ä∫·ÄÑ·Ä∂·Äô·Äæ ·ÄÖ·Ä¨·Äõ·Ä±·Ä∏·Äñ·Ä±·Ä¨·Ä∫·Äë·Ä∂·Äô·Äæ ·Äî·Äæ·Äú·ÄØ·Ä∂·Ä∏·Äû·Ä¨·Ä∏·ÄÄ·Ä≠·ÄØ·Äñ·ÄØ·Ä∂·Ä∏·Äú·ÄΩ·Äæ·Äô·Ä∫·Ä∏·ÄÖ·Ä±·Äû·Ä±·Ä¨ ·ÄÖ·Ä¨·Äõ·ÄÅ·Äº·ÄÑ·Ä∫·Ä∏'},
 {'translation_text': '·ÄÄ·Äô·Äπ·Äò·Ä¨·Äê·ÄÖ·Ä∫·Äú·ÄΩ·Äæ·Ä¨·Ä∏·Äô·Äæ·Ä¨ ·ÄÜ·ÄÄ·Ä∫·Äû·ÄΩ·Äö·Ä∫·Äô·Äæ·ÄØ·Äï·Ä´·Åã'}]

In [75]:
# Apply the translation function to the entire dataset
# This will process in batches automatically
translated_dataset = dataset.map(translate)

Map:   0%|          | 0/10 [00:00<?, ? examples/s]

Winning a friendly sports competition against rival schools. Victory celebrations in full swing! 
·Äô·Ä≠·Äê·Ä∫·ÄÜ·ÄΩ·Ä±·Äô·Äª·Ä¨·Ä∏·Ä°·Ä¨·Ä∏ ·Ä°·Ä¨·Ä∏·ÄÄ·ÄÖ·Ä¨·Ä∏·Äï·Äº·Ä≠·ÄØ·ÄÑ·Ä∫·Äï·ÄΩ·Ä≤·Äê·ÄΩ·ÄÑ·Ä∫ ·Äï·Äº·Ä≠·ÄØ·ÄÑ·Ä∫·Äò·ÄÄ·Ä∫·ÄÄ·Äª·Ä±·Ä¨·ÄÑ·Ä∫·Ä∏·Äô·Äª·Ä¨·Ä∏·Ä°·Ä¨·Ä∏ ·Ä°·Äî·Ä≠·ÄØ·ÄÑ·Ä∫·Äõ·ÄÅ·Äº·ÄÑ·Ä∫·Ä∏·Åã

Receiving a heartfelt letter from a pen pal in another country. Connecting across the globe! 
[·ÄÖ·Ä¨·Äô·Äª·ÄÄ·Ä∫·Äî·Äæ·Ä¨ ·ÅÇ·ÅÉ ·Äï·Ä´ ·Äõ·ÄØ·Äï·Ä∫·Äï·ÄØ·Ä∂]

Creating a beautiful mural with fellow art enthusiasts. The power of collaboration and creativity! 
·Ä°·Äî·ÄØ·Äï·Ää·Ä¨ ·Äù·Ä´·Äû·Äî·Ä¨·Ä°·Ä≠·ÄØ·Ä∏·Äô·Äª·Ä¨·Ä∏·Äî·Ä≤·Ä∑·Ä°·Äê·Ä∞ ·Äú·Äæ·Äï·Äê·Ä≤·Ä∑ ·Äî·Ä∂·Äõ·Ä∂·ÄÜ·Ä±·Ä∏·Äõ·Ä±·Ä∏·Äï·Äî·Ä∫·Ä∏·ÄÅ·Äª·ÄÆ·ÄÄ·Ä≠·ÄØ ·Äñ·Äî·Ä∫·Äê·ÄÆ·Ä∏·ÄÅ·Äº·ÄÑ·Ä∫·Ä∏·Åã

Participating in a school-wide art exhibition. Witnessing creativity and spreading positive vibes! 
·ÄÄ·Äª·Ä±·Ä¨·ÄÑ·Ä∫·Ä∏·Äê·ÄÖ·Ä∫·Äù·Äæ·Äô·Ä∫·Ä∏·Äú·ÄØ·Ä∂·Ä∏ ·Ä°·Äî·ÄØ·Äï·Ää·Ä¨·Äï·Äº·Äï·ÄΩ·Ä≤·Äê·ÄΩ·ÄÑ·Ä∫ ·Äï·Ä´·Äù·ÄÑ·Ä∫·ÄÅ·Äº·ÄÑ·Ä∫

In [76]:
ordered_columns = ["Text", "Text_MM", "Sentiment", "Timestamp", "User", 
                  "Platform", "Hashtags", "Retweets", "Likes", 
                  "Country", "Year", "Month", "Day", "Hour"]

df = translated_dataset.to_pandas()
# Filter to only include columns that actually exist
ordered_columns = [col for col in ordered_columns if col in df.columns]
df = df[ordered_columns]

In [73]:
df

Unnamed: 0,Text,Text_MM,Sentiment,Timestamp,User,Platform,Hashtags,Retweets,Likes,Country,Year,Month,Day,Hour
0,Winning a friendly sports competition against ...,·Äô·Ä≠·Äê·Ä∫·ÄÜ·ÄΩ·Ä±·Äô·Äª·Ä¨·Ä∏·Ä°·Ä¨·Ä∏ ·Ä°·Ä¨·Ä∏·ÄÄ·ÄÖ·Ä¨·Ä∏·Äï·Äº·Ä≠·ÄØ·ÄÑ·Ä∫·Äï·ÄΩ·Ä≤·Äê·ÄΩ·ÄÑ·Ä∫ ·Äï·Äº·Ä≠·ÄØ·ÄÑ·Ä∫·Äò·ÄÄ·Ä∫·ÄÄ...,Happy,2023-10-20 14:15:00,SportsVictoryHighSchool,Twitter,#SportsTriumph #HighSchoolAthletics,26.0,50.0,USA,2023,10,20,14
1,Receiving a heartfelt letter from a pen pal in...,[·ÄÖ·Ä¨·Äô·Äª·ÄÄ·Ä∫·Äî·Äæ·Ä¨ ·ÅÇ·ÅÉ ·Äï·Ä´ ·Äõ·ÄØ·Äï·Ä∫·Äï·ÄØ·Ä∂],Happy,2023-10-21 17:30:00,PenPalConnectionHighSchool,Facebook,#GlobalFriendship #HighSchoolCorrespondence,23.0,45.0,Canada,2023,10,21,17
2,Creating a beautiful mural with fellow art ent...,·Ä°·Äî·ÄØ·Äï·Ää·Ä¨ ·Äù·Ä´·Äû·Äî·Ä¨·Ä°·Ä≠·ÄØ·Ä∏·Äô·Äª·Ä¨·Ä∏·Äî·Ä≤·Ä∑·Ä°·Äê·Ä∞ ·Äú·Äæ·Äï·Äê·Ä≤·Ä∑ ·Äî·Ä∂·Äõ·Ä∂·ÄÜ·Ä±·Ä∏·Äõ·Ä±·Ä∏·Äï·Äî...,Happy,2023-10-22 20:45:00,MuralCreationHighSchool,Instagram,#ArtCollaboration #HighSchoolCreativity,22.0,43.0,UK,2023,10,22,20
3,Participating in a school-wide art exhibition....,·ÄÄ·Äª·Ä±·Ä¨·ÄÑ·Ä∫·Ä∏·Äê·ÄÖ·Ä∫·Äù·Äæ·Äô·Ä∫·Ä∏·Äú·ÄØ·Ä∂·Ä∏ ·Ä°·Äî·ÄØ·Äï·Ää·Ä¨·Äï·Äº·Äï·ÄΩ·Ä≤·Äê·ÄΩ·ÄÑ·Ä∫ ·Äï·Ä´·Äù·ÄÑ·Ä∫·ÄÅ·Äº·ÄÑ·Ä∫·Ä∏...,Happy,2015-11-10 16:45:00,ArtExhibitionJoyHighSchool,Instagram,#ArtisticExpression #HighSchoolCreativity,23.0,44.0,USA,2015,11,10,16
4,Achieving a personal best in a track and field...,[·ÄÖ·Ä¨·Äô·Äª·ÄÄ·Ä∫·Äî·Äæ·Ä¨ ·ÅÇ·ÅÅ ·Äï·Ä´ ·Äõ·ÄØ·Äï·Ä∫·Äï·ÄØ·Ä∂],Happy,2016-09-14 12:30:00,TrackFieldSuccessHighSchool,Twitter,#AthleticAchievement #HighSchoolSports,26.0,51.0,Canada,2016,9,14,12
5,Collaborating on a science project that receiv...,·Äí·Ä±·Äû·Äê·ÄΩ·ÄÑ·Ä∫·Ä∏ ·Äï·Äº·Äï·ÄΩ·Ä≤·Äê·ÄÖ·Ä∫·ÄÅ·ÄØ·Äê·ÄΩ·ÄÑ·Ä∫ ·Ä°·Äû·Ä≠·Ä°·Äô·Äæ·Äê·Ä∫·Äï·Äº·ÄØ·ÄÅ·Ä∂·Äõ·Äû·Ä±·Ä¨ ·Äû·Ä≠·Äï·Äπ...,Happy,2017-08-18 18:20:00,ScienceProjectSuccessHighSchool,Facebook,#ScienceFairWinner #HighSchoolScience,20.0,39.0,UK,2017,8,18,18
6,Attending a surprise birthday party organized ...,·Äô·Ä≠·Äê·Ä∫·ÄÜ·ÄΩ·Ä±·Äê·ÄΩ·Ä±·ÄÄ ·ÄÄ·Äª·ÄÑ·Ä∫·Ä∏·Äï·Äê·Ä≤·Ä∑ ·Äô·Äô·Äª·Äæ·Ä±·Ä¨·Ä∫·Äú·ÄÑ·Ä∑·Ä∫·Äê·Ä≤·Ä∑ ·Äô·ÄΩ·Ä±·Ä∏·Äî·Ä±·Ä∑·Äï·Ä´...,Happy,2018-06-22 14:15:00,BirthdayPartyJoyHighSchool,Instagram,#SurpriseCelebration #HighSchoolFriendship,25.0,48.0,USA,2018,6,22,14
7,Successfully fundraising for a school charity ...,·ÄÄ·Äª·Ä±·Ä¨·ÄÑ·Ä∫·Ä∏·Äï·Äõ·Äü·Ä≠·Äê·Äú·ÄØ·Äï·Ä∫·ÄÑ·Äî·Ä∫·Ä∏·Äê·ÄÖ·Ä∫·ÄÅ·ÄØ·Ä°·Äê·ÄΩ·ÄÄ·Ä∫ ·ÄÑ·ÄΩ·Ä±·ÄÄ·Äº·Ä±·Ä∏·Äë·Ä±·Ä¨·ÄÄ·Ä∫·Äï·Ä∂·Ä∑...,Happy,2019-04-05 17:30:00,CharityFundraisingTriumphHighSchool,Twitter,#CommunityGiving #HighSchoolPhilanthropy,22.0,42.0,Canada,2019,4,5,17
8,"Participating in a multicultural festival, cel...",·Äö·Äâ·Ä∫·ÄÄ·Äª·Ä±·Ä∏·Äô·Äæ·ÄØ·ÄÖ·ÄØ·Ä∂·Äú·ÄÑ·Ä∫·Äû·Ä±·Ä¨·Äï·ÄΩ·Ä≤·Äê·Ä±·Ä¨·Ä∫·Äê·ÄΩ·ÄÑ·Ä∫ ·Äï·Ä´·Äù·ÄÑ·Ä∫·ÄÅ·Äº·ÄÑ·Ä∫·Ä∏·Åä ·ÄÇ·ÄÆ·Äê...,Happy,2020-02-29 20:45:00,MulticulturalFestivalJoyHighSchool,Facebook,#CulturalCelebration #HighSchoolUnity,21.0,43.0,UK,2020,2,29,20
9,Organizing a virtual talent show during challe...,·ÄÖ·Ä≠·Äî·Ä∫·ÄÅ·Ä±·Ä´·Ä∫·Äô·Äæ·ÄØ·Äõ·Äæ·Ä≠·Äê·Ä≤·Ä∑ ·Ä°·ÄÅ·Äª·Ä≠·Äî·Ä∫·Äê·ÄΩ·Ä±·Äô·Äæ·Ä¨ ·Äï·ÄÑ·Ä∫·ÄÄ·Ä≠·ÄØ·Äö·Ä∫·ÄÖ·ÄΩ·Äô·Ä∫·Ä∏·Äõ·Ää...,Happy,2020-11-15 15:15:00,VirtualTalentShowSuccessHighSchool,Instagram,#VirtualEntertainment #HighSchoolPositivity,24.0,47.0,USA,2020,11,15,15


In [51]:
previous_ds = load_dataset("chuuhtetnaing/myanmar-social-media-sentiment-analysis-dataset")
previous_df = previous_ds['train'].to_pandas()

In [52]:
previous_df = previous_df.rename(columns={"Text_MM": "Text_MM_old"})

In [53]:
previous_df

Unnamed: 0,Text,Text_MM_old,Sentiment,Timestamp,User,Platform,Hashtags,Retweets,Likes,Country,Year,Month,Day,Hour
0,Enjoying a beautiful day at the park! ...,·Äï·Äî·Ä∫·Ä∏·ÄÅ·Äº·Ä∂·Äë·Ä≤·Äô·Äæ·Ä¨ ·Äú·Äæ·Äï·Äê·Ä≤·Ä∑ ·Äî·Ä±·Ä∑·ÄÄ·Ä≠·ÄØ ·ÄÅ·Ä∂·ÄÖ·Ä¨·Ä∏·Äõ·ÄÑ·Ä∫·Ä∏·Äï·Ä±·Ä´·Ä∑·Åã,Positive,2023-01-15 12:30:00,User123,Twitter,#Nature #Park,15.0,30.0,USA,2023,1,15,12
1,Traffic was terrible this morning. ...,·Äí·ÄÆ·Äô·Äî·ÄÄ·Ä∫·ÄÄ ·Äö·Ä¨·Äâ·Ä∫·ÄÄ·Äº·Ä±·Ä¨·ÄÄ ·Ä°·Äõ·Äô·Ä∫·Ä∏·ÄÄ·Ä≠·ÄØ ·ÄÜ·Ä≠·ÄØ·Ä∏·Äê·Äö·Ä∫·Åã,Negative,2023-01-15 08:45:00,CommuterX,Twitter,#Traffic #Morning,5.0,10.0,Canada,2023,1,15,8
2,Just finished an amazing workout! üí™ ...,·Ä°·Ä∂·Ä∑·Ä°·Ä¨·Ä∏·Äû·ÄÑ·Ä∑·Ä∫·ÄÖ·Äõ·Ä¨ ·Äú·Ä±·Ä∑·ÄÄ·Äª·ÄÑ·Ä∑·Ä∫·ÄÅ·Äî·Ä∫·Ä∏ ·Äï·Äº·ÄÆ·Ä∏·Äû·ÄΩ·Ä¨·Ä∏·Äï·Äº·ÄÆ·Åã,Positive,2023-01-15 15:45:00,FitnessFan,Instagram,#Fitness #Workout,20.0,40.0,USA,2023,1,15,15
3,Excited about the upcoming weekend getaway! ...,·Äú·Ä¨·Äô·Äö·Ä∑·Ä∫ ·Äû·ÄÆ·Äê·ÄÑ·Ä∫·Ä∏·Äï·Äê·Ä∫·Äõ·Ä≤·Ä∑ ·Äë·ÄΩ·ÄÄ·Ä∫·ÄÅ·ÄΩ·Ä¨·Äô·Äæ·ÄØ·Ä°·Äê·ÄΩ·ÄÄ·Ä∫ ·ÄÖ·Ä≠·Äê·Ä∫·Äú·Äæ·ÄØ·Äï·Ä∫·Äõ...,Positive,2023-01-15 18:20:00,AdventureX,Facebook,#Travel #Adventure,8.0,15.0,UK,2023,1,15,18
4,Trying out a new recipe for dinner tonight. ...,·Äí·ÄÆ·Ää·ÄÖ·Ä¨·Ä°·Äê·ÄΩ·ÄÄ·Ä∫ ·Äü·ÄÑ·Ä∫·Ä∏·ÄÅ·Äª·ÄÄ·Ä∫·Äî·Ää·Ä∫·Ä∏ ·Ä°·Äû·ÄÖ·Ä∫·Äê·ÄÖ·Ä∫·ÄÅ·ÄØ ·ÄÖ·Äô·Ä∫·Ä∏·Äî·Ä±·Äê·Äö·Ä∫·Åã,Neutral,2023-01-15 19:55:00,ChefCook,Instagram,#Cooking #Food,12.0,25.0,Australia,2023,1,15,19
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
727,Collaborating on a science project that receiv...,·Äí·Ä±·Äû·Äê·ÄΩ·ÄÑ·Ä∫·Ä∏ ·Äï·Äº·Äï·ÄΩ·Ä≤·Äê·ÄÖ·Ä∫·ÄÅ·ÄØ·Äê·ÄΩ·ÄÑ·Ä∫ ·Ä°·Äû·Ä≠·Ä°·Äô·Äæ·Äê·Ä∫·Äï·Äº·ÄØ·ÄÅ·Ä∂·Äõ·Äû·Ä±·Ä¨ ·Äû·Ä≠·Äï·Äπ...,Happy,2017-08-18 18:20:00,ScienceProjectSuccessHighSchool,Facebook,#ScienceFairWinner #HighSchoolScience,20.0,39.0,UK,2017,8,18,18
728,Attending a surprise birthday party organized ...,·Äô·Ä≠·Äê·Ä∫·ÄÜ·ÄΩ·Ä±·Äê·ÄΩ·Ä±·ÄÄ ·ÄÄ·Äª·ÄÑ·Ä∫·Ä∏·Äï·Äê·Ä≤·Ä∑ ·Äô·Äô·Äª·Äæ·Ä±·Ä¨·Ä∫·Äú·ÄÑ·Ä∑·Ä∫·Äê·Ä≤·Ä∑ ·Äô·ÄΩ·Ä±·Ä∏·Äî·Ä±·Ä∑·Äï·Ä´...,Happy,2018-06-22 14:15:00,BirthdayPartyJoyHighSchool,Instagram,#SurpriseCelebration #HighSchoolFriendship,25.0,48.0,USA,2018,6,22,14
729,Successfully fundraising for a school charity ...,·ÄÄ·Äª·Ä±·Ä¨·ÄÑ·Ä∫·Ä∏·Äï·Äõ·Äü·Ä≠·Äê·Äú·ÄØ·Äï·Ä∫·ÄÑ·Äî·Ä∫·Ä∏·Äê·ÄÖ·Ä∫·ÄÅ·ÄØ·Ä°·Äê·ÄΩ·ÄÄ·Ä∫ ·ÄÑ·ÄΩ·Ä±·ÄÄ·Äº·Ä±·Ä∏·Äë·Ä±·Ä¨·ÄÄ·Ä∫·Äï·Ä∂·Ä∑...,Happy,2019-04-05 17:30:00,CharityFundraisingTriumphHighSchool,Twitter,#CommunityGiving #HighSchoolPhilanthropy,22.0,42.0,Canada,2019,4,5,17
730,"Participating in a multicultural festival, cel...",·Äö·Äâ·Ä∫·ÄÄ·Äª·Ä±·Ä∏·Äô·Äæ·ÄØ·ÄÖ·ÄØ·Ä∂·Äú·ÄÑ·Ä∫·Äû·Ä±·Ä¨·Äï·ÄΩ·Ä≤·Äê·Ä±·Ä¨·Ä∫·Äê·ÄΩ·ÄÑ·Ä∫ ·Äï·Ä´·Äù·ÄÑ·Ä∫·ÄÅ·Äº·ÄÑ·Ä∫·Ä∏·Åä ·ÄÇ·ÄÆ·Äê...,Happy,2020-02-29 20:45:00,MulticulturalFestivalJoyHighSchool,Facebook,#CulturalCelebration #HighSchoolUnity,21.0,43.0,UK,2020,2,29,20


In [59]:
translated_dataset[-1]

{'Text': "Organizing a virtual talent show during challenging times, bringing smiles to classmates' faces! ",
 'Sentiment': ' Happy ',
 'Timestamp': '2020-11-15 15:15:00',
 'User': ' VirtualTalentShowSuccessHighSchool ',
 'Platform': ' Instagram ',
 'Hashtags': ' #VirtualEntertainment #HighSchoolPositivity ',
 'Retweets': 24.0,
 'Likes': 47.0,
 'Country': ' USA',
 'Year': 2020,
 'Month': 11,
 'Day': 15,
 'Hour': 15,
 'Text_MM': '·ÄÖ·Ä≠·Äî·Ä∫·ÄÅ·Ä±·Ä´·Ä∫·Äô·Äæ·ÄØ·Äõ·Äæ·Ä≠·Äê·Ä≤·Ä∑ ·Ä°·ÄÅ·Äª·Ä≠·Äî·Ä∫·Äê·ÄΩ·Ä±·Äô·Äæ·Ä¨ ·Äï·ÄÑ·Ä∫·ÄÄ·Ä≠·ÄØ·Äö·Ä∫·ÄÖ·ÄΩ·Äô·Ä∫·Ä∏·Äõ·Ää·Ä∫ ·Äï·Äº·Äï·ÄΩ·Ä≤·Äê·ÄÖ·Ä∫·ÄÅ·ÄØ·ÄÄ·Ä≠·ÄØ ·Äñ·Äî·Ä∫·Äê·ÄÆ·Ä∏·ÄÅ·Äº·ÄÑ·Ä∫·Ä∏·Äï·Ä´·Åã ·Ä°·Äê·Äî·Ä∫·Ä∏·Äñ·Ä±·Ä¨·Ä∫·Äê·ÄΩ·Ä±·Äõ·Ä≤·Ä∑ ·Äô·Äª·ÄÄ·Ä∫·Äî·Äæ·Ä¨·Äê·ÄΩ·Ä±·Äï·Ä±·Ä´·Ä∫ ·Ä°·Äï·Äº·ÄØ·Ä∂·Ä∏·Äê·ÄΩ·Ä±·Äê·ÄÑ·Ä∫·Äõ·ÄÑ·Ä∫·Ä∏·Äï·Ä±·Ä´·Ä∑·Åã'}

In [54]:
df['Text_MM_old'] = previous_df['Text_MM_old']

In [55]:
df

Unnamed: 0,Text,Text_MM,Sentiment,Timestamp,User,Platform,Hashtags,Retweets,Likes,Country,Year,Month,Day,Hour,Text_MM_old
0,Enjoying a beautiful day at the park! ...,·Äï·Äî·Ä∫·Ä∏·ÄÅ·Äº·Ä∂·Äë·Ä≤·Äô·Äæ·Ä¨ ·Äú·Äæ·Äï·Äê·Ä≤·Ä∑ ·Äî·Ä±·Ä∑·ÄÄ·Ä≠·ÄØ ·ÄÅ·Ä∂·ÄÖ·Ä¨·Ä∏·Äõ·ÄÑ·Ä∫·Ä∏·Äï·Ä±·Ä´·Ä∑·Åã,Positive,2023-01-15 12:30:00,User123,Twitter,#Nature #Park,15.0,30.0,USA,2023,1,15,12,·Äï·Äî·Ä∫·Ä∏·ÄÅ·Äº·Ä∂·Äë·Ä≤·Äô·Äæ·Ä¨ ·Äú·Äæ·Äï·Äê·Ä≤·Ä∑ ·Äî·Ä±·Ä∑·ÄÄ·Ä≠·ÄØ ·ÄÅ·Ä∂·ÄÖ·Ä¨·Ä∏·Äõ·ÄÑ·Ä∫·Ä∏·Äï·Ä±·Ä´·Ä∑·Åã
1,Traffic was terrible this morning. ...,·Äí·ÄÆ·Äô·Äî·ÄÄ·Ä∫·ÄÄ ·Äö·Ä¨·Äâ·Ä∫·ÄÄ·Äº·Ä±·Ä¨·ÄÄ ·Ä°·Äõ·Äô·Ä∫·Ä∏·ÄÄ·Ä≠·ÄØ ·ÄÜ·Ä≠·ÄØ·Ä∏·Äê·Äö·Ä∫·Åã,Negative,2023-01-15 08:45:00,CommuterX,Twitter,#Traffic #Morning,5.0,10.0,Canada,2023,1,15,8,·Äí·ÄÆ·Äô·Äî·ÄÄ·Ä∫·ÄÄ ·Äö·Ä¨·Äâ·Ä∫·ÄÄ·Äº·Ä±·Ä¨·ÄÄ ·Ä°·Äõ·Äô·Ä∫·Ä∏·ÄÄ·Ä≠·ÄØ ·ÄÜ·Ä≠·ÄØ·Ä∏·Äê·Äö·Ä∫·Åã
2,Just finished an amazing workout! üí™ ...,·Ä°·Ä∂·Ä∑·Ä°·Ä¨·Ä∏·Äû·ÄÑ·Ä∑·Ä∫·ÄÖ·Äõ·Ä¨ ·Äú·Ä±·Ä∑·ÄÄ·Äª·ÄÑ·Ä∑·Ä∫·ÄÅ·Äî·Ä∫·Ä∏ ·Äï·Äº·ÄÆ·Ä∏·Äû·ÄΩ·Ä¨·Ä∏·Äï·Äº·ÄÆ·Åã,Positive,2023-01-15 15:45:00,FitnessFan,Instagram,#Fitness #Workout,20.0,40.0,USA,2023,1,15,15,·Ä°·Ä∂·Ä∑·Ä°·Ä¨·Ä∏·Äû·ÄÑ·Ä∑·Ä∫·ÄÖ·Äõ·Ä¨ ·Äú·Ä±·Ä∑·ÄÄ·Äª·ÄÑ·Ä∑·Ä∫·ÄÅ·Äî·Ä∫·Ä∏ ·Äï·Äº·ÄÆ·Ä∏·Äû·ÄΩ·Ä¨·Ä∏·Äï·Äº·ÄÆ·Åã
3,Excited about the upcoming weekend getaway! ...,·Äú·Ä¨·Äô·Äö·Ä∑·Ä∫ ·Äû·ÄÆ·Äê·ÄÑ·Ä∫·Ä∏·Äï·Äê·Ä∫·Äõ·Ä≤·Ä∑ ·Äë·ÄΩ·ÄÄ·Ä∫·ÄÅ·ÄΩ·Ä¨·Äô·Äæ·ÄØ·Ä°·Äê·ÄΩ·ÄÄ·Ä∫ ·ÄÖ·Ä≠·Äê·Ä∫·Äú·Äæ·ÄØ·Äï·Ä∫·Äõ...,Positive,2023-01-15 18:20:00,AdventureX,Facebook,#Travel #Adventure,8.0,15.0,UK,2023,1,15,18,·Äú·Ä¨·Äô·Äö·Ä∑·Ä∫ ·Äû·ÄÆ·Äê·ÄÑ·Ä∫·Ä∏·Äï·Äê·Ä∫·Äõ·Ä≤·Ä∑ ·Äë·ÄΩ·ÄÄ·Ä∫·ÄÅ·ÄΩ·Ä¨·Äô·Äæ·ÄØ·Ä°·Äê·ÄΩ·ÄÄ·Ä∫ ·ÄÖ·Ä≠·Äê·Ä∫·Äú·Äæ·ÄØ·Äï·Ä∫·Äõ...
4,Trying out a new recipe for dinner tonight. ...,·Äí·ÄÆ·Ää·ÄÖ·Ä¨·Ä°·Äê·ÄΩ·ÄÄ·Ä∫ ·Äü·ÄÑ·Ä∫·Ä∏·ÄÅ·Äª·ÄÄ·Ä∫·Äî·Ää·Ä∫·Ä∏ ·Ä°·Äû·ÄÖ·Ä∫·Äê·ÄÖ·Ä∫·ÄÅ·ÄØ ·ÄÖ·Äô·Ä∫·Ä∏·Äî·Ä±·Äê·Äö·Ä∫·Åã,Neutral,2023-01-15 19:55:00,ChefCook,Instagram,#Cooking #Food,12.0,25.0,Australia,2023,1,15,19,·Äí·ÄÆ·Ää·ÄÖ·Ä¨·Ä°·Äê·ÄΩ·ÄÄ·Ä∫ ·Äü·ÄÑ·Ä∫·Ä∏·ÄÅ·Äª·ÄÄ·Ä∫·Äî·Ää·Ä∫·Ä∏ ·Ä°·Äû·ÄÖ·Ä∫·Äê·ÄÖ·Ä∫·ÄÅ·ÄØ ·ÄÖ·Äô·Ä∫·Ä∏·Äî·Ä±·Äê·Äö·Ä∫·Åã
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
727,Collaborating on a science project that receiv...,·Äí·Ä±·Äû·Äê·ÄΩ·ÄÑ·Ä∫·Ä∏ ·Äï·Äº·Äï·ÄΩ·Ä≤·Äê·ÄÖ·Ä∫·ÄÅ·ÄØ·Äê·ÄΩ·ÄÑ·Ä∫ ·Ä°·Äû·Ä≠·Ä°·Äô·Äæ·Äê·Ä∫·Äï·Äº·ÄØ·ÄÅ·Ä∂·Äõ·Äû·Ä±·Ä¨ ·Äû·Ä≠·Äï·Äπ...,Happy,2017-08-18 18:20:00,ScienceProjectSuccessHighSchool,Facebook,#ScienceFairWinner #HighSchoolScience,20.0,39.0,UK,2017,8,18,18,·Äí·Ä±·Äû·Äê·ÄΩ·ÄÑ·Ä∫·Ä∏ ·Äï·Äº·Äï·ÄΩ·Ä≤·Äê·ÄÖ·Ä∫·ÄÅ·ÄØ·Äê·ÄΩ·ÄÑ·Ä∫ ·Ä°·Äû·Ä≠·Ä°·Äô·Äæ·Äê·Ä∫·Äï·Äº·ÄØ·ÄÅ·Ä∂·Äõ·Äû·Ä±·Ä¨ ·Äû·Ä≠·Äï·Äπ...
728,Attending a surprise birthday party organized ...,·Äô·Ä≠·Äê·Ä∫·ÄÜ·ÄΩ·Ä±·Äê·ÄΩ·Ä±·ÄÄ ·ÄÄ·Äª·ÄÑ·Ä∫·Ä∏·Äï·Äê·Ä≤·Ä∑ ·Äô·Äô·Äª·Äæ·Ä±·Ä¨·Ä∫·Äú·ÄÑ·Ä∑·Ä∫·Äê·Ä≤·Ä∑ ·Äô·ÄΩ·Ä±·Ä∏·Äî·Ä±·Ä∑·Äï·Ä´...,Happy,2018-06-22 14:15:00,BirthdayPartyJoyHighSchool,Instagram,#SurpriseCelebration #HighSchoolFriendship,25.0,48.0,USA,2018,6,22,14,·Äô·Ä≠·Äê·Ä∫·ÄÜ·ÄΩ·Ä±·Äê·ÄΩ·Ä±·ÄÄ ·ÄÄ·Äª·ÄÑ·Ä∫·Ä∏·Äï·Äê·Ä≤·Ä∑ ·Äô·Äô·Äª·Äæ·Ä±·Ä¨·Ä∫·Äú·ÄÑ·Ä∑·Ä∫·Äê·Ä≤·Ä∑ ·Äô·ÄΩ·Ä±·Ä∏·Äî·Ä±·Ä∑·Äï·Ä´...
729,Successfully fundraising for a school charity ...,·ÄÄ·Äª·Ä±·Ä¨·ÄÑ·Ä∫·Ä∏·Äï·Äõ·Äü·Ä≠·Äê·Äú·ÄØ·Äï·Ä∫·ÄÑ·Äî·Ä∫·Ä∏·Äê·ÄÖ·Ä∫·ÄÅ·ÄØ·Ä°·Äê·ÄΩ·ÄÄ·Ä∫ ·ÄÑ·ÄΩ·Ä±·ÄÄ·Äº·Ä±·Ä∏·Äë·Ä±·Ä¨·ÄÄ·Ä∫·Äï·Ä∂·Ä∑...,Happy,2019-04-05 17:30:00,CharityFundraisingTriumphHighSchool,Twitter,#CommunityGiving #HighSchoolPhilanthropy,22.0,42.0,Canada,2019,4,5,17,·ÄÄ·Äª·Ä±·Ä¨·ÄÑ·Ä∫·Ä∏·Äï·Äõ·Äü·Ä≠·Äê·Äú·ÄØ·Äï·Ä∫·ÄÑ·Äî·Ä∫·Ä∏·Äê·ÄÖ·Ä∫·ÄÅ·ÄØ·Ä°·Äê·ÄΩ·ÄÄ·Ä∫ ·ÄÑ·ÄΩ·Ä±·ÄÄ·Äº·Ä±·Ä∏·Äë·Ä±·Ä¨·ÄÄ·Ä∫·Äï·Ä∂·Ä∑...
730,"Participating in a multicultural festival, cel...",·Äö·Äâ·Ä∫·ÄÄ·Äª·Ä±·Ä∏·Äô·Äæ·ÄØ·ÄÖ·ÄØ·Ä∂·Äú·ÄÑ·Ä∫·Äû·Ä±·Ä¨·Äï·ÄΩ·Ä≤·Äê·Ä±·Ä¨·Ä∫·Äê·ÄΩ·ÄÑ·Ä∫ ·Äï·Ä´·Äù·ÄÑ·Ä∫·ÄÅ·Äº·ÄÑ·Ä∫·Ä∏·Åä ·ÄÇ·ÄÆ·Äê...,Happy,2020-02-29 20:45:00,MulticulturalFestivalJoyHighSchool,Facebook,#CulturalCelebration #HighSchoolUnity,21.0,43.0,UK,2020,2,29,20,·Äö·Äâ·Ä∫·ÄÄ·Äª·Ä±·Ä∏·Äô·Äæ·ÄØ·ÄÖ·ÄØ·Ä∂·Äú·ÄÑ·Ä∫·Äû·Ä±·Ä¨·Äï·ÄΩ·Ä≤·Äê·Ä±·Ä¨·Ä∫·Äê·ÄΩ·ÄÑ·Ä∫ ·Äï·Ä´·Äù·ÄÑ·Ä∫·ÄÅ·Äº·ÄÑ·Ä∫·Ä∏·Åä ·ÄÇ·ÄÆ·Äê...


In [56]:
ordered_columns = ["Text", "Text_MM", "Text_MM_old", "Sentiment", "Timestamp", "User", 
                  "Platform", "Hashtags", "Retweets", "Likes", 
                  "Country", "Year", "Month", "Day", "Hour"]

# Filter to only include columns that actually exist
# ordered_columns = [col for col in ordered_columns if col in df.columns]
df = df[ordered_columns]

In [57]:
df

Unnamed: 0,Text,Text_MM,Text_MM_old,Sentiment,Timestamp,User,Platform,Hashtags,Retweets,Likes,Country,Year,Month,Day,Hour
0,Enjoying a beautiful day at the park! ...,·Äï·Äî·Ä∫·Ä∏·ÄÅ·Äº·Ä∂·Äë·Ä≤·Äô·Äæ·Ä¨ ·Äú·Äæ·Äï·Äê·Ä≤·Ä∑ ·Äî·Ä±·Ä∑·ÄÄ·Ä≠·ÄØ ·ÄÅ·Ä∂·ÄÖ·Ä¨·Ä∏·Äõ·ÄÑ·Ä∫·Ä∏·Äï·Ä±·Ä´·Ä∑·Åã,·Äï·Äî·Ä∫·Ä∏·ÄÅ·Äº·Ä∂·Äë·Ä≤·Äô·Äæ·Ä¨ ·Äú·Äæ·Äï·Äê·Ä≤·Ä∑ ·Äî·Ä±·Ä∑·ÄÄ·Ä≠·ÄØ ·ÄÅ·Ä∂·ÄÖ·Ä¨·Ä∏·Äõ·ÄÑ·Ä∫·Ä∏·Äï·Ä±·Ä´·Ä∑·Åã,Positive,2023-01-15 12:30:00,User123,Twitter,#Nature #Park,15.0,30.0,USA,2023,1,15,12
1,Traffic was terrible this morning. ...,·Äí·ÄÆ·Äô·Äî·ÄÄ·Ä∫·ÄÄ ·Äö·Ä¨·Äâ·Ä∫·ÄÄ·Äº·Ä±·Ä¨·ÄÄ ·Ä°·Äõ·Äô·Ä∫·Ä∏·ÄÄ·Ä≠·ÄØ ·ÄÜ·Ä≠·ÄØ·Ä∏·Äê·Äö·Ä∫·Åã,·Äí·ÄÆ·Äô·Äî·ÄÄ·Ä∫·ÄÄ ·Äö·Ä¨·Äâ·Ä∫·ÄÄ·Äº·Ä±·Ä¨·ÄÄ ·Ä°·Äõ·Äô·Ä∫·Ä∏·ÄÄ·Ä≠·ÄØ ·ÄÜ·Ä≠·ÄØ·Ä∏·Äê·Äö·Ä∫·Åã,Negative,2023-01-15 08:45:00,CommuterX,Twitter,#Traffic #Morning,5.0,10.0,Canada,2023,1,15,8
2,Just finished an amazing workout! üí™ ...,·Ä°·Ä∂·Ä∑·Ä°·Ä¨·Ä∏·Äû·ÄÑ·Ä∑·Ä∫·ÄÖ·Äõ·Ä¨ ·Äú·Ä±·Ä∑·ÄÄ·Äª·ÄÑ·Ä∑·Ä∫·ÄÅ·Äî·Ä∫·Ä∏ ·Äï·Äº·ÄÆ·Ä∏·Äû·ÄΩ·Ä¨·Ä∏·Äï·Äº·ÄÆ·Åã,·Ä°·Ä∂·Ä∑·Ä°·Ä¨·Ä∏·Äû·ÄÑ·Ä∑·Ä∫·ÄÖ·Äõ·Ä¨ ·Äú·Ä±·Ä∑·ÄÄ·Äª·ÄÑ·Ä∑·Ä∫·ÄÅ·Äî·Ä∫·Ä∏ ·Äï·Äº·ÄÆ·Ä∏·Äû·ÄΩ·Ä¨·Ä∏·Äï·Äº·ÄÆ·Åã,Positive,2023-01-15 15:45:00,FitnessFan,Instagram,#Fitness #Workout,20.0,40.0,USA,2023,1,15,15
3,Excited about the upcoming weekend getaway! ...,·Äú·Ä¨·Äô·Äö·Ä∑·Ä∫ ·Äû·ÄÆ·Äê·ÄÑ·Ä∫·Ä∏·Äï·Äê·Ä∫·Äõ·Ä≤·Ä∑ ·Äë·ÄΩ·ÄÄ·Ä∫·ÄÅ·ÄΩ·Ä¨·Äô·Äæ·ÄØ·Ä°·Äê·ÄΩ·ÄÄ·Ä∫ ·ÄÖ·Ä≠·Äê·Ä∫·Äú·Äæ·ÄØ·Äï·Ä∫·Äõ...,·Äú·Ä¨·Äô·Äö·Ä∑·Ä∫ ·Äû·ÄÆ·Äê·ÄÑ·Ä∫·Ä∏·Äï·Äê·Ä∫·Äõ·Ä≤·Ä∑ ·Äë·ÄΩ·ÄÄ·Ä∫·ÄÅ·ÄΩ·Ä¨·Äô·Äæ·ÄØ·Ä°·Äê·ÄΩ·ÄÄ·Ä∫ ·ÄÖ·Ä≠·Äê·Ä∫·Äú·Äæ·ÄØ·Äï·Ä∫·Äõ...,Positive,2023-01-15 18:20:00,AdventureX,Facebook,#Travel #Adventure,8.0,15.0,UK,2023,1,15,18
4,Trying out a new recipe for dinner tonight. ...,·Äí·ÄÆ·Ää·ÄÖ·Ä¨·Ä°·Äê·ÄΩ·ÄÄ·Ä∫ ·Äü·ÄÑ·Ä∫·Ä∏·ÄÅ·Äª·ÄÄ·Ä∫·Äî·Ää·Ä∫·Ä∏ ·Ä°·Äû·ÄÖ·Ä∫·Äê·ÄÖ·Ä∫·ÄÅ·ÄØ ·ÄÖ·Äô·Ä∫·Ä∏·Äî·Ä±·Äê·Äö·Ä∫·Åã,·Äí·ÄÆ·Ää·ÄÖ·Ä¨·Ä°·Äê·ÄΩ·ÄÄ·Ä∫ ·Äü·ÄÑ·Ä∫·Ä∏·ÄÅ·Äª·ÄÄ·Ä∫·Äî·Ää·Ä∫·Ä∏ ·Ä°·Äû·ÄÖ·Ä∫·Äê·ÄÖ·Ä∫·ÄÅ·ÄØ ·ÄÖ·Äô·Ä∫·Ä∏·Äî·Ä±·Äê·Äö·Ä∫·Åã,Neutral,2023-01-15 19:55:00,ChefCook,Instagram,#Cooking #Food,12.0,25.0,Australia,2023,1,15,19
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
727,Collaborating on a science project that receiv...,·Äí·Ä±·Äû·Äê·ÄΩ·ÄÑ·Ä∫·Ä∏ ·Äï·Äº·Äï·ÄΩ·Ä≤·Äê·ÄÖ·Ä∫·ÄÅ·ÄØ·Äê·ÄΩ·ÄÑ·Ä∫ ·Ä°·Äû·Ä≠·Ä°·Äô·Äæ·Äê·Ä∫·Äï·Äº·ÄØ·ÄÅ·Ä∂·Äõ·Äû·Ä±·Ä¨ ·Äû·Ä≠·Äï·Äπ...,·Äí·Ä±·Äû·Äê·ÄΩ·ÄÑ·Ä∫·Ä∏ ·Äï·Äº·Äï·ÄΩ·Ä≤·Äê·ÄÖ·Ä∫·ÄÅ·ÄØ·Äê·ÄΩ·ÄÑ·Ä∫ ·Ä°·Äû·Ä≠·Ä°·Äô·Äæ·Äê·Ä∫·Äï·Äº·ÄØ·ÄÅ·Ä∂·Äõ·Äû·Ä±·Ä¨ ·Äû·Ä≠·Äï·Äπ...,Happy,2017-08-18 18:20:00,ScienceProjectSuccessHighSchool,Facebook,#ScienceFairWinner #HighSchoolScience,20.0,39.0,UK,2017,8,18,18
728,Attending a surprise birthday party organized ...,·Äô·Ä≠·Äê·Ä∫·ÄÜ·ÄΩ·Ä±·Äê·ÄΩ·Ä±·ÄÄ ·ÄÄ·Äª·ÄÑ·Ä∫·Ä∏·Äï·Äê·Ä≤·Ä∑ ·Äô·Äô·Äª·Äæ·Ä±·Ä¨·Ä∫·Äú·ÄÑ·Ä∑·Ä∫·Äê·Ä≤·Ä∑ ·Äô·ÄΩ·Ä±·Ä∏·Äî·Ä±·Ä∑·Äï·Ä´...,·Äô·Ä≠·Äê·Ä∫·ÄÜ·ÄΩ·Ä±·Äê·ÄΩ·Ä±·ÄÄ ·ÄÄ·Äª·ÄÑ·Ä∫·Ä∏·Äï·Äê·Ä≤·Ä∑ ·Äô·Äô·Äª·Äæ·Ä±·Ä¨·Ä∫·Äú·ÄÑ·Ä∑·Ä∫·Äê·Ä≤·Ä∑ ·Äô·ÄΩ·Ä±·Ä∏·Äî·Ä±·Ä∑·Äï·Ä´...,Happy,2018-06-22 14:15:00,BirthdayPartyJoyHighSchool,Instagram,#SurpriseCelebration #HighSchoolFriendship,25.0,48.0,USA,2018,6,22,14
729,Successfully fundraising for a school charity ...,·ÄÄ·Äª·Ä±·Ä¨·ÄÑ·Ä∫·Ä∏·Äï·Äõ·Äü·Ä≠·Äê·Äú·ÄØ·Äï·Ä∫·ÄÑ·Äî·Ä∫·Ä∏·Äê·ÄÖ·Ä∫·ÄÅ·ÄØ·Ä°·Äê·ÄΩ·ÄÄ·Ä∫ ·ÄÑ·ÄΩ·Ä±·ÄÄ·Äº·Ä±·Ä∏·Äë·Ä±·Ä¨·ÄÄ·Ä∫·Äï·Ä∂·Ä∑...,·ÄÄ·Äª·Ä±·Ä¨·ÄÑ·Ä∫·Ä∏·Äï·Äõ·Äü·Ä≠·Äê·Äú·ÄØ·Äï·Ä∫·ÄÑ·Äî·Ä∫·Ä∏·Äê·ÄÖ·Ä∫·ÄÅ·ÄØ·Ä°·Äê·ÄΩ·ÄÄ·Ä∫ ·ÄÑ·ÄΩ·Ä±·ÄÄ·Äº·Ä±·Ä∏·Äë·Ä±·Ä¨·ÄÄ·Ä∫·Äï·Ä∂·Ä∑...,Happy,2019-04-05 17:30:00,CharityFundraisingTriumphHighSchool,Twitter,#CommunityGiving #HighSchoolPhilanthropy,22.0,42.0,Canada,2019,4,5,17
730,"Participating in a multicultural festival, cel...",·Äö·Äâ·Ä∫·ÄÄ·Äª·Ä±·Ä∏·Äô·Äæ·ÄØ·ÄÖ·ÄØ·Ä∂·Äú·ÄÑ·Ä∫·Äû·Ä±·Ä¨·Äï·ÄΩ·Ä≤·Äê·Ä±·Ä¨·Ä∫·Äê·ÄΩ·ÄÑ·Ä∫ ·Äï·Ä´·Äù·ÄÑ·Ä∫·ÄÅ·Äº·ÄÑ·Ä∫·Ä∏·Åä ·ÄÇ·ÄÆ·Äê...,·Äö·Äâ·Ä∫·ÄÄ·Äª·Ä±·Ä∏·Äô·Äæ·ÄØ·ÄÖ·ÄØ·Ä∂·Äú·ÄÑ·Ä∫·Äû·Ä±·Ä¨·Äï·ÄΩ·Ä≤·Äê·Ä±·Ä¨·Ä∫·Äê·ÄΩ·ÄÑ·Ä∫ ·Äï·Ä´·Äù·ÄÑ·Ä∫·ÄÅ·Äº·ÄÑ·Ä∫·Ä∏·Åä ·ÄÇ·ÄÆ·Äê...,Happy,2020-02-29 20:45:00,MulticulturalFestivalJoyHighSchool,Facebook,#CulturalCelebration #HighSchoolUnity,21.0,43.0,UK,2020,2,29,20


In [58]:
df.to_csv("to_check_manually.csv", index=False)

In [29]:
reordered_dataset = Dataset.from_pandas(df)

In [30]:
reordered_dataset

Dataset({
    features: ['Text', 'Text_MM', 'Sentiment', 'Timestamp', 'User', 'Platform', 'Hashtags', 'Retweets', 'Likes', 'Country', 'Year', 'Month', 'Day', 'Hour'],
    num_rows: 732
})

In [31]:
reordered_dataset.push_to_hub("chuuhtetnaing/myanmar-social-media-sentiment-analysis-dataset")

Uploading the dataset shards:   0%|          | 0/1 [00:00<?, ?it/s]

Creating parquet from Arrow format:   0%|          | 0/1 [00:00<?, ?ba/s]

CommitInfo(commit_url='https://huggingface.co/datasets/chuuhtetnaing/myanmar-social-media-sentiment-analysis-dataset/commit/6c00516d603b1822b4c1fcc7fd20e042b727e645', commit_message='Upload dataset', commit_description='', oid='6c00516d603b1822b4c1fcc7fd20e042b727e645', pr_url=None, repo_url=RepoUrl('https://huggingface.co/datasets/chuuhtetnaing/myanmar-social-media-sentiment-analysis-dataset', endpoint='https://huggingface.co', repo_type='dataset', repo_id='chuuhtetnaing/myanmar-social-media-sentiment-analysis-dataset'), pr_revision=None, pr_num=None)