In [None]:
!pip install value-nlp
!pip install pandas

In [None]:
# Mount Google Drive at /content/drive. Every input and output CSV path used
# by the translation cells below lives under /content/drive/MyDrive.
from google.colab import drive
drive.mount('/content/drive')

In [None]:
# Run this cell before any of the translation cells below (and after the
# install and Drive-mount cells above): each translation cell relies on the
# `pd` import and on the shared `aave` dialect object created here.

import pandas as pd
from multivalue import Dialects

# Initialize the dialect for African American Vernacular English.
# `aave` is a module-level object that every `translate_text` below calls.
aave = Dialects.AfricanAmericanVernacular()

In [None]:
# WSC VALUE Translation Code

def translate_text(text):
    """Return ``aave.transform(text)``, or ``text`` itself if that call fails.

    Translation is best-effort: any ``Exception`` raised while transforming is
    printed and the input is handed back unchanged.
    """
    try:
        translated = aave.transform(text)
    except Exception as err:
        print(f"Error in translation: {err}")
        # Fall back to the untouched input so the caller can keep going.
        return text
    return translated

def main():
    """Translate the WSC paragraphs with VALUE and save the rows that changed.

    Reads 'Translated WSC.csv', stores the ``translate_text`` output for every
    'Original Paragraph' in a new 'VALUE Paragraph' column, and writes the rows
    whose VALUE output differs from the original to
    'Filtered WSC Paragraphs.csv' with the columns ordered
    Original / AAVE / VALUE.
    """
    # Load the original CSV file
    file_path = '/content/drive/MyDrive/Algoverse/New Results/GPT 4o mini Translations/Translated WSC.csv'
    df = pd.read_csv(file_path)

    # The columns are used under their existing names ('Original Paragraph',
    # 'AAVE Paragraph'), so no rename step is required.

    # Initialize new column for VALUE translation
    df['VALUE Paragraph'] = ''

    # Translate the 'Original Paragraph' column, reporting progress per row
    for index, original_text in df['Original Paragraph'].items():
        df.at[index, 'VALUE Paragraph'] = translate_text(original_text)
        print(f"Processed Original Paragraph row {index + 1}")

    # Keep only the rows VALUE actually changed. A missing original (NaN)
    # never compares equal to anything, itself included, so it would slip
    # through a plain `!=` test; exclude those rows explicitly.
    has_original = df['Original Paragraph'].notna()
    was_changed = df['Original Paragraph'] != df['VALUE Paragraph']
    filtered_df = df.loc[
        has_original & was_changed,
        ['Original Paragraph', 'AAVE Paragraph', 'VALUE Paragraph'],
    ]

    # Save the new CSV
    output_path = '/content/drive/MyDrive/Algoverse/New Results/VALUE Translations/WSC/Filtered WSC Paragraphs.csv'
    filtered_df.to_csv(output_path, index=False)

    print(f"Filtered data saved to {output_path}")

# Entry point: run the WSC pipeline when this code executes as the top-level
# module (`__name__ == '__main__'`).
if __name__ == '__main__':
    main()

In [None]:
# BoolQ VALUE Translation Code

def translate_text(text):
    """Return ``aave.transform(text)``, or ``text`` itself if that call fails.

    Any ``Exception`` raised by the transform is printed and the input is
    returned unchanged, so one bad value does not abort a whole column.
    """
    try:
        translated = aave.transform(text)
    except Exception as err:
        print("Error in translation:", err)
        return text
    return translated

def main():
    """Translate the BoolQ passages and questions with VALUE and save the changed rows.

    Reads 'Translated BoolQ.csv', adds 'VALUE Passage' / 'VALUE Question'
    columns produced by ``translate_text``, renames the 'SAE ...' columns to
    'Original ...', and writes two CSVs (passages, questions) that each contain
    only the rows whose VALUE output differs from the original text.
    """
    # Load the original CSV file
    file_path = '/content/drive/MyDrive/Algoverse/New Results/GPT 4o mini Translations/Translated BoolQ.csv'
    df = pd.read_csv(file_path)

    # Translate 'SAE Passage' and 'SAE Question'
    df['VALUE Passage'] = df['SAE Passage'].apply(translate_text)
    df['VALUE Question'] = df['SAE Question'].apply(translate_text)

    # Rename columns
    df = df.rename(columns={'SAE Passage': 'Original Passage', 'SAE Question': 'Original Question'})

    # Filter and save the passages, then the questions
    outputs = [
        (
            ['Original Passage', 'AAVE Passage', 'VALUE Passage'],
            '/content/drive/MyDrive/Algoverse/New Results/VALUE Translations/Filtered Passages No Match.csv',
        ),
        (
            ['Original Question', 'AAVE Question', 'VALUE Question'],
            '/content/drive/MyDrive/Algoverse/New Results/VALUE Translations/Filtered Questions No Match.csv',
        ),
    ]
    for columns, output_path in outputs:
        original_col, _, value_col = columns
        subset = df[columns]
        # Keep only rows VALUE actually changed. NaN != NaN is True, so a
        # missing original would pass a plain `!=` test; drop those explicitly.
        has_original = subset[original_col].notna()
        was_changed = subset[value_col] != subset[original_col]
        subset[has_original & was_changed].to_csv(output_path, index=False)

# Entry point: run the BoolQ pipeline when this code executes as the top-level
# module (`__name__ == '__main__'`).
if __name__ == '__main__':
    main()

In [None]:
# CoLA VALUE Translation Code

def translate_text(text):
    """Return ``aave.transform(text)``, or ``text`` itself if that call fails.

    Translation is best-effort: any ``Exception`` raised while transforming is
    printed and the input is handed back unchanged.
    """
    try:
        result = aave.transform(text)
    except Exception as err:
        print(f"Error in translation: {err}")
        # Return the original text if an error occurs
        result = text
    return result

def main():
    """Translate the CoLA sentences with VALUE and save the rows that changed.

    Reads 'Translated CoLA.csv', stores the ``translate_text`` output for every
    'Sentence' in a new 'VALUE Sentence' column, renames the source columns to
    'Original Sentence' / 'AAVE Sentence', and writes the rows whose VALUE
    output differs from the original to 'Filtered CoLA Sentences.csv'.
    """
    # Load the original CSV file
    file_path = '/content/drive/MyDrive/Algoverse/New Results/GPT 4o mini Translations/Translated CoLA.csv'
    df = pd.read_csv(file_path)

    # Initialize new column for the VALUE translation
    df['VALUE Sentence'] = ''

    # Translate the 'Sentence' column, reporting progress per row
    for index, original_sentence in df['Sentence'].items():
        df.at[index, 'VALUE Sentence'] = translate_text(original_sentence)
        print(f"Processed row {index + 1}")

    # Rename columns
    df.rename(columns={'Sentence': 'Original Sentence', 'Translated Sentence': 'AAVE Sentence'}, inplace=True)

    # Keep only the rows VALUE actually changed. A missing original (NaN)
    # never compares equal to anything, itself included, so it would slip
    # through a plain `!=` test; exclude those rows explicitly.
    has_original = df['Original Sentence'].notna()
    was_changed = df['Original Sentence'] != df['VALUE Sentence']
    filtered_df = df.loc[
        has_original & was_changed,
        ['Original Sentence', 'AAVE Sentence', 'VALUE Sentence'],
    ]

    # Save the new CSV
    output_path = '/content/drive/MyDrive/Algoverse/New Results/VALUE Translations/Filtered CoLA Sentences.csv'
    filtered_df.to_csv(output_path, index=False)

    print(f"Filtered data saved to {output_path}")

# Entry point: run the CoLA pipeline when this code executes as the top-level
# module (`__name__ == '__main__'`).
if __name__ == '__main__':
    main()

In [None]:
# COPA VALUE Translation Code

def translate_text(text):
    """Return ``aave.transform(text)``, or ``text`` itself if that call fails.

    Any ``Exception`` raised by the transform is printed and the input is
    returned unchanged, so one bad value does not abort a whole column.
    """
    try:
        translated = aave.transform(text)
    except Exception as err:
        print(f"Error in translation: {err}")
        # Fall back to the untouched input so the caller can keep going.
        return text
    return translated

def process_column(df, original_col, aave_col, value_col):
    """Fill ``value_col`` with VALUE translations and return the rows that changed.

    Args:
        df: DataFrame containing ``original_col`` and ``aave_col``. It is
            modified in place: ``value_col`` is written for every row.
        original_col: Name of the column holding the source text.
        aave_col: Name of the column holding the existing AAVE translation;
            it is only carried through to the result.
        value_col: Name of the column that receives ``translate_text`` output.

    Returns:
        A DataFrame with the columns ``[original_col, aave_col, value_col]``
        restricted to rows that have an original text and whose VALUE output
        differs from it.
    """
    # Translate the original column, reporting progress per row
    for index, original_text in df[original_col].items():
        df.at[index, value_col] = translate_text(original_text)
        print(f"Processed {original_col} row {index + 1}")

    # Keep only the rows VALUE actually changed. A missing original (NaN)
    # never compares equal to anything, itself included, so it would slip
    # through a plain `!=` test; exclude those rows explicitly.
    has_original = df[original_col].notna()
    was_changed = df[original_col] != df[value_col]

    # Select the changed rows with the columns in Original / AAVE / VALUE order
    return df.loc[has_original & was_changed, [original_col, aave_col, value_col]]

def main():
    """Run the VALUE translation over the COPA premise and both choices.

    Reads 'Translated Copa.csv', renames the source columns to the
    'Original ...' / 'AAVE ...' scheme, and for each of the three text fields
    saves the frame returned by ``process_column`` to its own CSV in the COPA
    output folder.
    """
    # Load the original CSV file
    source_csv = '/content/drive/MyDrive/Algoverse/New Results/GPT 4o mini Translations/Translated Copa.csv'
    df = pd.read_csv(source_csv)

    # Rename columns
    column_names = {
        'Premise': 'Original Premise',
        'Choice 1': 'Original Choice 1',
        'Choice 2': 'Original Choice 2',
        'Translated Premise': 'AAVE Premise',
        'Translated Choice 1': 'AAVE Choice 1',
        'Translated Choice 2': 'AAVE Choice 2'
    }
    df.rename(columns=column_names, inplace=True)

    # Initialize new columns for VALUE translations
    for empty_col in ('VALUE Premise', 'VALUE Choice 1', 'VALUE Choice 2'):
        df[empty_col] = ''

    # One job per text field: (original, AAVE, VALUE, output file name)
    jobs = [
        ('Original Premise', 'AAVE Premise', 'VALUE Premise', 'VALUE COPA Premise.csv'),
        ('Original Choice 1', 'AAVE Choice 1', 'VALUE Choice 1', 'VALUE COPA Choice 1.csv'),
        ('Original Choice 2', 'AAVE Choice 2', 'VALUE Choice 2', 'VALUE COPA Choice 2.csv')
    ]

    # Process each column and save to separate CSV files
    for original_col, aave_col, value_col, output_file in jobs:
        changed_rows = process_column(df, original_col, aave_col, value_col)
        output_path = f'/content/drive/MyDrive/Algoverse/New Results/VALUE Translations/COPA/{output_file}'
        changed_rows.to_csv(output_path, index=False)
        print(f"Filtered data saved to {output_path}")

# Entry point: run the COPA pipeline when this code executes as the top-level
# module (`__name__ == '__main__'`).
if __name__ == '__main__':
    main()

In [None]:
# MultiRC VALUE Translation Code

def translate_text(text):
    """Return ``aave.transform(text)``, or ``text`` itself if that call fails.

    Translation is best-effort: any ``Exception`` raised while transforming is
    printed and the input is handed back unchanged.
    """
    try:
        result = aave.transform(text)
    except Exception as err:
        print(f"Error in translation: {err}")
        # Return the original text if an error occurs
        result = text
    return result

def process_column(df, original_col, aave_col, value_col):
    """Fill ``value_col`` with VALUE translations and return the rows that changed.

    Args:
        df: DataFrame containing ``original_col`` and ``aave_col``. It is
            modified in place: ``value_col`` is written for every row.
        original_col: Name of the column holding the source text.
        aave_col: Name of the column holding the existing AAVE translation;
            it is only carried through to the result.
        value_col: Name of the column that receives ``translate_text`` output.

    Returns:
        A DataFrame with the columns ``[original_col, aave_col, value_col]``
        restricted to rows that have an original text and whose VALUE output
        differs from it.
    """
    # Translate the original column, reporting progress per row
    for index, original_text in df[original_col].items():
        df.at[index, value_col] = translate_text(original_text)
        print(f"Processed {original_col} row {index + 1}")

    # Keep only the rows VALUE actually changed. A missing original (NaN)
    # never compares equal to anything, itself included, so it would slip
    # through a plain `!=` test; exclude those rows explicitly.
    has_original = df[original_col].notna()
    was_changed = df[original_col] != df[value_col]

    # Select the changed rows with the columns in Original / AAVE / VALUE order
    return df.loc[has_original & was_changed, [original_col, aave_col, value_col]]

def main():
    """Run the VALUE translation over the MultiRC paragraphs and questions.

    Reads 'Translated MultiRC.csv', renames the source columns to the
    'Original ...' / 'AAVE ...' scheme, and for each of the two text fields
    saves the frame returned by ``process_column`` to its own CSV in the
    MultiRC output folder.
    """
    # Load the original CSV file
    source_csv = '/content/drive/MyDrive/Algoverse/New Results/GPT 4o mini Translations/Translated MultiRC.csv'
    df = pd.read_csv(source_csv)

    # Rename columns
    column_names = {
        'Paragraph': 'Original Paragraph',
        'Question': 'Original Question',
        'Translated Paragraph': 'AAVE Paragraph',
        'Translated Question': 'AAVE Question'
    }
    df.rename(columns=column_names, inplace=True)

    # Initialize new columns for VALUE translations
    for empty_col in ('VALUE Paragraph', 'VALUE Question'):
        df[empty_col] = ''

    # One job per text field: (original, AAVE, VALUE, output file name)
    jobs = [
        ('Original Paragraph', 'AAVE Paragraph', 'VALUE Paragraph', 'VALUE MultiRC Paragraph.csv'),
        ('Original Question', 'AAVE Question', 'VALUE Question', 'VALUE MultiRC Question.csv')
    ]

    # Process each column and save to separate CSV files
    for original_col, aave_col, value_col, output_file in jobs:
        changed_rows = process_column(df, original_col, aave_col, value_col)
        output_path = f'/content/drive/MyDrive/Algoverse/New Results/VALUE Translations/MultiRC/{output_file}'
        changed_rows.to_csv(output_path, index=False)
        print(f"Filtered data saved to {output_path}")

# Entry point: run the MultiRC pipeline when this code executes as the
# top-level module (`__name__ == '__main__'`).
if __name__ == '__main__':
    main()

In [None]:
# SST-2 VALUE Translation Code

def translate_text(text):
    """Return ``aave.transform(text)``, or ``text`` itself if that call fails.

    Any ``Exception`` raised by the transform is printed and the input is
    returned unchanged, so one bad value does not abort a whole column.
    """
    try:
        translated = aave.transform(text)
    except Exception as err:
        print(f"Error in translation: {err}")
        # Fall back to the untouched input so the caller can keep going.
        return text
    return translated

def main():
    """Translate the SST-2 sentences with VALUE and save the rows that changed.

    Reads 'Translated SST-2.csv', renames 'Translated Sentence' to
    'AAVE Sentence', stores the ``translate_text`` output for every
    'Original Sentence' in a new 'VALUE Sentence' column, and writes the rows
    whose VALUE output differs from the original to
    'VALUE SST-2 Sentences.csv'.
    """
    # Load the original CSV file
    file_path = '/content/drive/MyDrive/Algoverse/New Results/GPT 4o mini Translations/Translated SST-2.csv'
    df = pd.read_csv(file_path)

    # Rename columns ('Original Sentence' is used under its existing name)
    df.rename(columns={'Translated Sentence': 'AAVE Sentence'}, inplace=True)

    # Initialize new column for VALUE translation
    df['VALUE Sentence'] = ''

    # Translate the 'Original Sentence' column, reporting progress per row
    for index, original_text in df['Original Sentence'].items():
        df.at[index, 'VALUE Sentence'] = translate_text(original_text)
        print(f"Processed Original Sentence row {index + 1}")

    # Keep only the rows VALUE actually changed. A missing original (NaN)
    # never compares equal to anything, itself included, so it would slip
    # through a plain `!=` test; exclude those rows explicitly.
    has_original = df['Original Sentence'].notna()
    was_changed = df['Original Sentence'] != df['VALUE Sentence']
    filtered_df = df.loc[
        has_original & was_changed,
        ['Original Sentence', 'AAVE Sentence', 'VALUE Sentence'],
    ]

    # Save the new CSV
    output_path = '/content/drive/MyDrive/Algoverse/New Results/VALUE Translations/SST-2/VALUE SST-2 Sentences.csv'
    filtered_df.to_csv(output_path, index=False)

    print(f"Filtered data saved to {output_path}")

# Entry point: run the SST-2 pipeline when this code executes as the top-level
# module (`__name__ == '__main__'`).
if __name__ == '__main__':
    main()