In [1]:
from tqdm import tqdm
import pandas as pd
import string, math

In [2]:
def _print_label_distribution(data, column, heading):
    """Print the entailment / neutral / contradiction breakdown of one label column.

    Each printed line shows how many times the label name matches in `column`
    and that count's share of the rows whose value is not the string "NULL".

    Args:
        data: DataFrame holding `column`.
        column: Name of the label column to summarise.
        heading: Line printed above the three label rows.
    """
    labels = data[column]
    # Denominator: rows whose label is not the "NULL" placeholder.
    labelled_rows = len(data[labels != "NULL"])

    print(heading)
    for short_name, label in (("E", "entailment"), ("N", "neutral"), ("C", "contradiction")):
        # str.count tallies pattern matches per cell; the sum is the column total.
        count = labels.str.count(label).sum()
        # Guard the division so a column without labelled rows reports 0 instead of nan.
        share = round(count / labelled_rows, 2) * 100 if labelled_rows else 0.0
        # ".1f" hides float noise such as 28.000000000000004 left by scaling the ratio.
        print(f"{short_name}: {count} ({share:.1f} %)")


def count_label(data, message, include_prediction=False):
    """Print the label distribution of a result frame.

    Args:
        data: DataFrame with a 'Label from Gold Answer' column (and a
            'Label from Prediction Answer' column when `include_prediction`
            is true).
        message: Name shown, upper-cased, in the section heading.
        include_prediction: When true, also print the distribution of
            'Label from Prediction Answer' before the gold one. Defaults to
            False, which prints the gold distribution only.

    Returns:
        None. The report is written to standard output, ending with the
        total number of rows in `data`.
    """
    if include_prediction:
        _print_label_distribution(
            data, 'Label from Prediction Answer', f"PREDICTION {message.upper()}"
        )
        print()

    _print_label_distribution(data, 'Label from Gold Answer', f"GOLD {message.upper()}")
    print()
    print(f"Total data: {len(data)}")

In [3]:
def _tally_properties(properties, answer_kind):
    """Count the entailment / neutral / contradiction rows for one answer kind.

    Args:
        properties: Series of strings such as 'Right answer and neutral label'.
        answer_kind: Either "Right" or "Wrong".

    Returns:
        A list of (short label, count) pairs in E, N, C order.
    """
    return [
        (short_name, properties.str.count(f"{answer_kind} answer and {label} label").sum())
        for short_name, label in (("E", "entailment"), ("N", "neutral"), ("C", "contradiction"))
    ]


def _print_property_group(prefix, tallies):
    """Print one group of tallies with each count's share of the group total."""
    group_total = sum(count for _, count in tallies)
    for short_name, count in tallies:
        if group_total != 0:
            # ".1f" hides float noise such as 28.000000000000004 left by scaling the ratio.
            share = round(count / group_total, 2) * 100
            print(f"{prefix}{short_name}: {count} ({share:.1f}) %")
        else:
            # An empty group has no meaningful ratio; report plain zeros.
            print(f"{prefix}{short_name}: 0 (0) %")


def count_properties(data, message):
    """Print how right and wrong answers split across the three labels.

    Args:
        data: DataFrame with a 'properties' column whose values read
            '<Right|Wrong> answer and <entailment|neutral|contradiction> label'.
        message: Name shown, upper-cased, as the report heading.

    Returns:
        None. The report is written to standard output: the heading, the
        RE/RN/RC lines, a blank line, then the WE/WN/WC lines. Percentages
        are relative to the right-answer and wrong-answer totals respectively.
    """
    properties = data['properties']
    # Tally everything before printing so a bad column fails before any output.
    right_tallies = _tally_properties(properties, "Right")
    wrong_tallies = _tally_properties(properties, "Wrong")

    print(message.upper())
    _print_property_group("R", right_tallies)
    print()
    _print_property_group("W", wrong_tallies)

In [4]:
def remove_punctuation(text):
    """Trim ASCII punctuation from both ends of `text`.

    Only leading and trailing characters found in `string.punctuation` are
    dropped; punctuation inside the text is left in place.
    """
    edge_characters = string.punctuation
    return text.lstrip(edge_characters).rstrip(edge_characters)

def _normalize_answer(answer):
    """Return the lower-cased answer with outer whitespace and punctuation removed.

    Missing values (NaN, None, pd.NA) become the empty string; any other
    non-string value is converted with str() first.
    """
    if not isinstance(answer, str):
        if pd.isna(answer):
            return ""
        answer = str(answer)
    return remove_punctuation(answer.lower().strip())


def _answer_tokens(normalized_answer):
    """Split a normalized answer into its set of punctuation-trimmed words."""
    trimmed_words = (remove_punctuation(word) for word in normalized_answer.split())
    # Punctuation-only words (e.g. "-") trim down to ""; keeping them would make
    # two unrelated answers look as if they shared a word.
    return {word for word in trimmed_words if word}


def return_overlap_between_gold_and_pred(data):
    """Flag rows whose prediction partially overlaps the gold answer.

    A row is flagged when the prediction and gold answer share at least one
    word but are not equal after normalization (lower-casing plus trimming of
    outer whitespace and punctuation). Exact matches and answers with no
    shared word are not flagged.

    Args:
        data: DataFrame with 'Prediction Answer' and 'Gold Answer' columns.
            Rows are paired by position, so any index is accepted.

    Returns:
        The same DataFrame object, with a boolean 'is_overlap' column added
        (or replaced) in place.
    """
    overlap_flags = []
    # Iterate over the values rather than data[col][i]: the latter is a label
    # lookup and fails on frames whose index is not 0..n-1.
    answer_pairs = zip(data['Prediction Answer'], data['Gold Answer'])

    for raw_prediction, raw_gold in tqdm(answer_pairs, total=len(data)):
        prediction = _normalize_answer(raw_prediction)
        gold = _normalize_answer(raw_gold)

        shared_words = _answer_tokens(prediction) & _answer_tokens(gold)
        overlap_flags.append(bool(shared_words) and prediction != gold)

    data['is_overlap'] = overlap_flags
    return data

# All (drop nothing)

## All (drop nothing) - Model idk-mrc-nli_keep+indonli+mnli-translated

In [5]:
# Read the two result workbooks for this model, one per dataset.
df_idkmrc, df_tydiqaid = map(
    pd.read_excel,
    (
        "df_idkmrc_idk-mrc-nli_keep+indonli+mnli-translated.xlsx",
        "df_tydiqaid_idk-mrc-nli_keep+indonli+mnli-translated.xlsx",
    ),
)

In [6]:
named_frames = ((df_idkmrc, "IDK-MRC"), (df_tydiqaid, "TyDI-QA-ID"))

# Gold-label distribution for each dataset, with a 24-character rule in between.
for position, (frame, title) in enumerate(named_frames):
    if position > 0:
        print("=" * 24)
    count_label(frame, title)

print()

# Right/wrong-answer breakdown for each dataset, with a 20-character rule in between.
for position, (frame, title) in enumerate(named_frames):
    if position > 0:
        print("=" * 20)
    count_properties(frame, title)

GOLD IDK-MRC
E: 419 (49.0 %)
N: 13 (2.0 %)
C: 416 (49.0 %)

Total data: 848
GOLD TYDI-QA-ID
E: 846 (99.0 %)
N: 0 (0.0 %)
C: 11 (1.0 %)

Total data: 857

IDK-MRC
RE: 266 (100.0) %
RN: 0 (0.0) %
RC: 1 (0.0) %

WE: 142 (24.0) %
WN: 15 (3.0) %
WC: 424 (73.0) %
TYDI-QA-ID
RE: 569 (100.0) %
RN: 0 (0.0) %
RC: 1 (0.0) %

WE: 255 (89.0) %
WN: 1 (0.0) %
WC: 31 (11.0) %


## All (drop nothing) - Model idk-mrc-nli_keep

In [7]:
# Read the two result workbooks for this model, one per dataset.
df_idkmrc, df_tydiqaid = map(
    pd.read_excel,
    (
        "df_idkmrc_idk-mrc-nli_keep.xlsx",
        "df_tydiqaid_idk-mrc-nli_keep.xlsx",
    ),
)

In [8]:
named_frames = ((df_idkmrc, "IDK-MRC"), (df_tydiqaid, "TyDI-QA-ID"))

# Gold-label distribution for each dataset, with a 24-character rule in between.
for position, (frame, title) in enumerate(named_frames):
    if position > 0:
        print("=" * 24)
    count_label(frame, title)

print()

# Right/wrong-answer breakdown for each dataset, with a 20-character rule in between.
for position, (frame, title) in enumerate(named_frames):
    if position > 0:
        print("=" * 20)
    count_properties(frame, title)

GOLD IDK-MRC
E: 676 (80.0 %)
N: 0 (0.0 %)
C: 172 (20.0 %)

Total data: 848
GOLD TYDI-QA-ID
E: 849 (99.0 %)
N: 0 (0.0 %)
C: 8 (1.0 %)

Total data: 857

IDK-MRC
RE: 266 (100.0) %
RN: 0 (0.0) %
RC: 1 (0.0) %

WE: 416 (72.0) %
WN: 0 (0.0) %
WC: 165 (28.000000000000004) %
TYDI-QA-ID
RE: 570 (100.0) %
RN: 0 (0.0) %
RC: 0 (0.0) %

WE: 274 (95.0) %
WN: 0 (0.0) %
WC: 13 (5.0) %


## All (drop nothing) - Model indonli+mnli-translated

In [9]:
# Read the two result workbooks for this model, one per dataset.
df_idkmrc, df_tydiqaid = map(
    pd.read_excel,
    (
        "df_idkmrc_indonli+mnli-translated.xlsx",
        "df_tydiqaid_indonli+mnli-translated.xlsx",
    ),
)

In [10]:
named_frames = ((df_idkmrc, "IDK-MRC"), (df_tydiqaid, "TyDI-QA-ID"))

# Gold-label distribution for each dataset, with a 24-character rule in between.
for position, (frame, title) in enumerate(named_frames):
    if position > 0:
        print("=" * 24)
    count_label(frame, title)

print()

# Right/wrong-answer breakdown for each dataset, with a 20-character rule in between.
for position, (frame, title) in enumerate(named_frames):
    if position > 0:
        print("=" * 20)
    count_properties(frame, title)

GOLD IDK-MRC
E: 255 (30.0 %)
N: 453 (53.0 %)
C: 140 (17.0 %)

Total data: 848
GOLD TYDI-QA-ID
E: 513 (60.0 %)
N: 286 (33.0 %)
C: 58 (7.000000000000001 %)

Total data: 857

IDK-MRC
RE: 178 (67.0) %
RN: 65 (24.0) %
RC: 24 (9.0) %

WE: 83 (14.000000000000002) %
WN: 386 (66.0) %
WC: 112 (19.0) %
TYDI-QA-ID
RE: 370 (65.0) %
RN: 167 (28.999999999999996) %
RC: 33 (6.0) %

WE: 145 (51.0) %
WN: 112 (39.0) %
WC: 30 (10.0) %


# Only unanswerable (gold answer NaN only)

## Only unanswerable (gold answer NaN only) - Model idk-mrc-nli_keep+indonli+mnli-translated

In [11]:
# Read the two result workbooks for this model, one per dataset.
df_idkmrc, df_tydiqaid = map(
    pd.read_excel,
    (
        "df_idkmrc_idk-mrc-nli_keep+indonli+mnli-translated.xlsx",
        "df_tydiqaid_idk-mrc-nli_keep+indonli+mnli-translated.xlsx",
    ),
)

# Keep only the rows that have no gold answer.
idkmrc_gold_missing = df_idkmrc['Gold Answer'].isna()
tydiqaid_gold_missing = df_tydiqaid['Gold Answer'].isna()
df_idkmrc_unanswerable_only = df_idkmrc.loc[idkmrc_gold_missing]
df_tydiqaid_unanswerable_only = df_tydiqaid.loc[tydiqaid_gold_missing]

In [12]:
named_frames = (
    (df_idkmrc_unanswerable_only, "IDK-MRC"),
    (df_tydiqaid_unanswerable_only, "TyDI-QA-ID"),
)

# Gold-label distribution for each dataset, with a 24-character rule in between.
for position, (frame, title) in enumerate(named_frames):
    if position > 0:
        print("=" * 24)
    count_label(frame, title)

print()

# Right/wrong-answer breakdown for each dataset, with a 20-character rule in between.
for position, (frame, title) in enumerate(named_frames):
    if position > 0:
        print("=" * 20)
    count_properties(frame, title)

GOLD IDK-MRC
E: 4 (1.0 %)
N: 13 (3.0 %)
C: 409 (96.0 %)

Total data: 426
GOLD TYDI-QA-ID
E: 0 (0.0 %)
N: 0 (0.0 %)
C: 1 (100.0 %)

Total data: 1

IDK-MRC
RE: 0 (0) %
RN: 0 (0) %
RC: 0 (0) %

WE: 35 (8.0) %
WN: 13 (3.0) %
WC: 378 (89.0) %
TYDI-QA-ID
RE: 0 (0) %
RN: 0 (0) %
RC: 0 (0) %

WE: 1 (100.0) %
WN: 0 (0.0) %
WC: 0 (0.0) %


## Only unanswerable (gold answer NaN only) - Model idk-mrc-nli_keep

In [13]:
# Read the two result workbooks for this model, one per dataset.
df_idkmrc, df_tydiqaid = map(
    pd.read_excel,
    (
        "df_idkmrc_idk-mrc-nli_keep.xlsx",
        "df_tydiqaid_idk-mrc-nli_keep.xlsx",
    ),
)

# Keep only the rows that have no gold answer.
idkmrc_gold_missing = df_idkmrc['Gold Answer'].isna()
tydiqaid_gold_missing = df_tydiqaid['Gold Answer'].isna()
df_idkmrc_unanswerable_only = df_idkmrc.loc[idkmrc_gold_missing]
df_tydiqaid_unanswerable_only = df_tydiqaid.loc[tydiqaid_gold_missing]

In [14]:
named_frames = (
    (df_idkmrc_unanswerable_only, "IDK-MRC"),
    (df_tydiqaid_unanswerable_only, "TyDI-QA-ID"),
)

# Gold-label distribution for each dataset, with a 24-character rule in between.
for position, (frame, title) in enumerate(named_frames):
    if position > 0:
        print("=" * 24)
    count_label(frame, title)

print()

# Right/wrong-answer breakdown for each dataset, with a 20-character rule in between.
for position, (frame, title) in enumerate(named_frames):
    if position > 0:
        print("=" * 20)
    count_properties(frame, title)

GOLD IDK-MRC
E: 264 (62.0 %)
N: 0 (0.0 %)
C: 162 (38.0 %)

Total data: 426
GOLD TYDI-QA-ID
E: 1 (100.0 %)
N: 0 (0.0 %)
C: 0 (0.0 %)

Total data: 1

IDK-MRC
RE: 0 (0) %
RN: 0 (0) %
RC: 0 (0) %

WE: 275 (65.0) %
WN: 0 (0.0) %
WC: 151 (35.0) %
TYDI-QA-ID
RE: 0 (0) %
RN: 0 (0) %
RC: 0 (0) %

WE: 1 (100.0) %
WN: 0 (0.0) %
WC: 0 (0.0) %


## Only unanswerable (gold answer NaN only) - Model indonli+mnli-translated

In [15]:
# Read the two result workbooks for this model, one per dataset.
df_idkmrc, df_tydiqaid = map(
    pd.read_excel,
    (
        "df_idkmrc_indonli+mnli-translated.xlsx",
        "df_tydiqaid_indonli+mnli-translated.xlsx",
    ),
)

# Keep only the rows that have no gold answer.
idkmrc_gold_missing = df_idkmrc['Gold Answer'].isna()
tydiqaid_gold_missing = df_tydiqaid['Gold Answer'].isna()
df_idkmrc_unanswerable_only = df_idkmrc.loc[idkmrc_gold_missing]
df_tydiqaid_unanswerable_only = df_tydiqaid.loc[tydiqaid_gold_missing]

In [16]:
named_frames = (
    (df_idkmrc_unanswerable_only, "IDK-MRC"),
    (df_tydiqaid_unanswerable_only, "TyDI-QA-ID"),
)

# Gold-label distribution for each dataset, with a 24-character rule in between.
for position, (frame, title) in enumerate(named_frames):
    if position > 0:
        print("=" * 24)
    count_label(frame, title)

print()

# Right/wrong-answer breakdown for each dataset, with a 20-character rule in between.
for position, (frame, title) in enumerate(named_frames):
    if position > 0:
        print("=" * 20)
    count_properties(frame, title)

GOLD IDK-MRC
E: 1 (0.0 %)
N: 333 (78.0 %)
C: 92 (22.0 %)

Total data: 426
GOLD TYDI-QA-ID
E: 0 (0.0 %)
N: 1 (100.0 %)
C: 0 (0.0 %)

Total data: 1

IDK-MRC
RE: 0 (0) %
RN: 0 (0) %
RC: 0 (0) %

WE: 13 (3.0) %
WN: 330 (77.0) %
WC: 83 (19.0) %
TYDI-QA-ID
RE: 0 (0) %
RN: 0 (0) %
RC: 0 (0) %

WE: 0 (0.0) %
WN: 1 (100.0) %
WC: 0 (0.0) %


# Answerable + Non overlap

## Answerable + Non overlap - Model idk-mrc-nli_keep+indonli+mnli-translated

In [17]:
# Read the two result workbooks for this model, one per dataset.
df_idkmrc, df_tydiqaid = map(
    pd.read_excel,
    (
        "df_idkmrc_idk-mrc-nli_keep+indonli+mnli-translated.xlsx",
        "df_tydiqaid_idk-mrc-nli_keep+indonli+mnli-translated.xlsx",
    ),
)

# Add the 'is_overlap' flag, then keep only the rows where it is False.
df_idkmrc = return_overlap_between_gold_and_pred(df_idkmrc)
df_tydiqaid = return_overlap_between_gold_and_pred(df_tydiqaid)
df_idkmrc = df_idkmrc.loc[df_idkmrc['is_overlap'].eq(False)].reset_index(drop=True)
df_tydiqaid = df_tydiqaid.loc[df_tydiqaid['is_overlap'].eq(False)].reset_index(drop=True)

# Of those, keep the rows that do have a gold answer.
df_idkmrc_answerable_non_overlap = (
    df_idkmrc[df_idkmrc['Gold Answer'].notna()].reset_index(drop=True)
)
df_tydiqaid_answerable_non_overlap = (
    df_tydiqaid[df_tydiqaid['Gold Answer'].notna()].reset_index(drop=True)
)

100%|██████████████████████████████████████████████████████████████████████████████| 848/848 [00:00<00:00, 63974.13it/s]
100%|██████████████████████████████████████████████████████████████████████████████| 857/857 [00:00<00:00, 60268.24it/s]


In [18]:
named_frames = (
    (df_idkmrc_answerable_non_overlap, "IDK-MRC"),
    (df_tydiqaid_answerable_non_overlap, "TyDI-QA-ID"),
)

# Gold-label distribution for each dataset, with a 24-character rule in between.
for position, (frame, title) in enumerate(named_frames):
    if position > 0:
        print("=" * 24)
    count_label(frame, title)

print()

# Right/wrong-answer breakdown for each dataset, with a 20-character rule in between.
for position, (frame, title) in enumerate(named_frames):
    if position > 0:
        print("=" * 20)
    count_properties(frame, title)

GOLD IDK-MRC
E: 322 (98.0 %)
N: 0 (0.0 %)
C: 5 (2.0 %)

Total data: 327
GOLD TYDI-QA-ID
E: 660 (99.0 %)
N: 0 (0.0 %)
C: 8 (1.0 %)

Total data: 668

IDK-MRC
RE: 266 (100.0) %
RN: 0 (0.0) %
RC: 1 (0.0) %

WE: 19 (32.0) %
WN: 2 (3.0) %
WC: 39 (65.0) %
TYDI-QA-ID
RE: 569 (100.0) %
RN: 0 (0.0) %
RC: 1 (0.0) %

WE: 72 (73.0) %
WN: 1 (1.0) %
WC: 25 (26.0) %


## Answerable + Non overlap - Model idk-mrc-nli_keep

In [19]:
# Read the two result workbooks for this model, one per dataset.
df_idkmrc, df_tydiqaid = map(
    pd.read_excel,
    (
        "df_idkmrc_idk-mrc-nli_keep.xlsx",
        "df_tydiqaid_idk-mrc-nli_keep.xlsx",
    ),
)

# Add the 'is_overlap' flag, then keep only the rows where it is False.
df_idkmrc = return_overlap_between_gold_and_pred(df_idkmrc)
df_tydiqaid = return_overlap_between_gold_and_pred(df_tydiqaid)
df_idkmrc = df_idkmrc.loc[df_idkmrc['is_overlap'].eq(False)].reset_index(drop=True)
df_tydiqaid = df_tydiqaid.loc[df_tydiqaid['is_overlap'].eq(False)].reset_index(drop=True)

# Of those, keep the rows that do have a gold answer.
df_idkmrc_answerable_non_overlap = (
    df_idkmrc[df_idkmrc['Gold Answer'].notna()].reset_index(drop=True)
)
df_tydiqaid_answerable_non_overlap = (
    df_tydiqaid[df_tydiqaid['Gold Answer'].notna()].reset_index(drop=True)
)

100%|██████████████████████████████████████████████████████████████████████████████| 848/848 [00:00<00:00, 69913.31it/s]
100%|██████████████████████████████████████████████████████████████████████████████| 857/857 [00:00<00:00, 61867.79it/s]


In [20]:
named_frames = (
    (df_idkmrc_answerable_non_overlap, "IDK-MRC"),
    (df_tydiqaid_answerable_non_overlap, "TyDI-QA-ID"),
)

# Gold-label distribution for each dataset, with a 24-character rule in between.
for position, (frame, title) in enumerate(named_frames):
    if position > 0:
        print("=" * 24)
    count_label(frame, title)

print()

# Right/wrong-answer breakdown for each dataset, with a 20-character rule in between.
for position, (frame, title) in enumerate(named_frames):
    if position > 0:
        print("=" * 20)
    count_properties(frame, title)

GOLD IDK-MRC
E: 319 (98.0 %)
N: 0 (0.0 %)
C: 8 (2.0 %)

Total data: 327
GOLD TYDI-QA-ID
E: 664 (99.0 %)
N: 0 (0.0 %)
C: 4 (1.0 %)

Total data: 668

IDK-MRC
RE: 266 (100.0) %
RN: 0 (0.0) %
RC: 1 (0.0) %

WE: 52 (87.0) %
WN: 0 (0.0) %
WC: 8 (13.0) %
TYDI-QA-ID
RE: 570 (100.0) %
RN: 0 (0.0) %
RC: 0 (0.0) %

WE: 89 (91.0) %
WN: 0 (0.0) %
WC: 9 (9.0) %


## Answerable + Non overlap - Model indonli+mnli-translated

In [21]:
# Read the two result workbooks for this model, one per dataset.
df_idkmrc, df_tydiqaid = map(
    pd.read_excel,
    (
        "df_idkmrc_indonli+mnli-translated.xlsx",
        "df_tydiqaid_indonli+mnli-translated.xlsx",
    ),
)

# Add the 'is_overlap' flag, then keep only the rows where it is False.
df_idkmrc = return_overlap_between_gold_and_pred(df_idkmrc)
df_tydiqaid = return_overlap_between_gold_and_pred(df_tydiqaid)
df_idkmrc = df_idkmrc.loc[df_idkmrc['is_overlap'].eq(False)].reset_index(drop=True)
df_tydiqaid = df_tydiqaid.loc[df_tydiqaid['is_overlap'].eq(False)].reset_index(drop=True)

# Of those, keep the rows that do have a gold answer.
df_idkmrc_answerable_non_overlap = (
    df_idkmrc[df_idkmrc['Gold Answer'].notna()].reset_index(drop=True)
)
df_tydiqaid_answerable_non_overlap = (
    df_tydiqaid[df_tydiqaid['Gold Answer'].notna()].reset_index(drop=True)
)

100%|██████████████████████████████████████████████████████████████████████████████| 848/848 [00:00<00:00, 70770.22it/s]
100%|██████████████████████████████████████████████████████████████████████████████| 857/857 [00:00<00:00, 62234.12it/s]


In [22]:
named_frames = (
    (df_idkmrc_answerable_non_overlap, "IDK-MRC"),
    (df_tydiqaid_answerable_non_overlap, "TyDI-QA-ID"),
)

# Gold-label distribution for each dataset, with a 24-character rule in between.
for position, (frame, title) in enumerate(named_frames):
    if position > 0:
        print("=" * 24)
    count_label(frame, title)

print()

# Right/wrong-answer breakdown for each dataset, with a 20-character rule in between.
for position, (frame, title) in enumerate(named_frames):
    if position > 0:
        print("=" * 20)
    count_properties(frame, title)

GOLD IDK-MRC
E: 197 (60.0 %)
N: 93 (28.000000000000004 %)
C: 37 (11.0 %)

Total data: 327
GOLD TYDI-QA-ID
E: 408 (61.0 %)
N: 215 (32.0 %)
C: 45 (7.000000000000001 %)

Total data: 668

IDK-MRC
RE: 178 (67.0) %
RN: 65 (24.0) %
RC: 24 (9.0) %

WE: 4 (7.000000000000001) %
WN: 34 (56.99999999999999) %
WC: 22 (37.0) %
TYDI-QA-ID
RE: 370 (65.0) %
RN: 167 (28.999999999999996) %
RC: 33 (6.0) %

WE: 29 (30.0) %
WN: 52 (53.0) %
WC: 17 (17.0) %


# Answerable + Overlap

## Answerable + Overlap - Model idk-mrc-nli_keep+indonli+mnli-translated

In [23]:
# Read the two result workbooks for this model, one per dataset.
df_idkmrc, df_tydiqaid = map(
    pd.read_excel,
    (
        "df_idkmrc_idk-mrc-nli_keep+indonli+mnli-translated.xlsx",
        "df_tydiqaid_idk-mrc-nli_keep+indonli+mnli-translated.xlsx",
    ),
)

# Keep every row that has a gold answer.
# NOTE(review): no 'is_overlap' filter is applied here, so these frames hold all
# answerable rows - confirm "Overlap" means "overlap rows included", not "overlap rows only".
df_idkmrc_answerable_overlap = (
    df_idkmrc[df_idkmrc['Gold Answer'].notna()].reset_index(drop=True)
)
df_tydiqaid_answerable_overlap = (
    df_tydiqaid[df_tydiqaid['Gold Answer'].notna()].reset_index(drop=True)
)

In [24]:
named_frames = (
    (df_idkmrc_answerable_overlap, "IDK-MRC"),
    (df_tydiqaid_answerable_overlap, "TyDI-QA-ID"),
)

# Gold-label distribution for each dataset, with a 24-character rule in between.
for position, (frame, title) in enumerate(named_frames):
    if position > 0:
        print("=" * 24)
    count_label(frame, title)

print()

# Right/wrong-answer breakdown for each dataset, with a 20-character rule in between.
for position, (frame, title) in enumerate(named_frames):
    if position > 0:
        print("=" * 20)
    count_properties(frame, title)

GOLD IDK-MRC
E: 415 (98.0 %)
N: 0 (0.0 %)
C: 7 (2.0 %)

Total data: 422
GOLD TYDI-QA-ID
E: 846 (99.0 %)
N: 0 (0.0 %)
C: 10 (1.0 %)

Total data: 856

IDK-MRC
RE: 266 (100.0) %
RN: 0 (0.0) %
RC: 1 (0.0) %

WE: 107 (69.0) %
WN: 2 (1.0) %
WC: 46 (30.0) %
TYDI-QA-ID
RE: 569 (100.0) %
RN: 0 (0.0) %
RC: 1 (0.0) %

WE: 254 (89.0) %
WN: 1 (0.0) %
WC: 31 (11.0) %


## Answerable + Overlap - Model idk-mrc-nli_keep

In [25]:
# Read the two result workbooks for this model, one per dataset.
df_idkmrc, df_tydiqaid = map(
    pd.read_excel,
    (
        "df_idkmrc_idk-mrc-nli_keep.xlsx",
        "df_tydiqaid_idk-mrc-nli_keep.xlsx",
    ),
)

# Keep every row that has a gold answer.
# NOTE(review): no 'is_overlap' filter is applied here, so these frames hold all
# answerable rows - confirm "Overlap" means "overlap rows included", not "overlap rows only".
df_idkmrc_answerable_overlap = (
    df_idkmrc[df_idkmrc['Gold Answer'].notna()].reset_index(drop=True)
)
df_tydiqaid_answerable_overlap = (
    df_tydiqaid[df_tydiqaid['Gold Answer'].notna()].reset_index(drop=True)
)

In [26]:
named_frames = (
    (df_idkmrc_answerable_overlap, "IDK-MRC"),
    (df_tydiqaid_answerable_overlap, "TyDI-QA-ID"),
)

# Gold-label distribution for each dataset, with a 24-character rule in between.
for position, (frame, title) in enumerate(named_frames):
    if position > 0:
        print("=" * 24)
    count_label(frame, title)

print()

# Right/wrong-answer breakdown for each dataset, with a 20-character rule in between.
for position, (frame, title) in enumerate(named_frames):
    if position > 0:
        print("=" * 20)
    count_properties(frame, title)

GOLD IDK-MRC
E: 412 (98.0 %)
N: 0 (0.0 %)
C: 10 (2.0 %)

Total data: 422
GOLD TYDI-QA-ID
E: 848 (99.0 %)
N: 0 (0.0 %)
C: 8 (1.0 %)

Total data: 856

IDK-MRC
RE: 266 (100.0) %
RN: 0 (0.0) %
RC: 1 (0.0) %

WE: 141 (91.0) %
WN: 0 (0.0) %
WC: 14 (9.0) %
TYDI-QA-ID
RE: 570 (100.0) %
RN: 0 (0.0) %
RC: 0 (0.0) %

WE: 273 (95.0) %
WN: 0 (0.0) %
WC: 13 (5.0) %


## Answerable + Overlap - Model indonli+mnli-translated

In [27]:
# Read the two result workbooks for this model, one per dataset.
df_idkmrc, df_tydiqaid = map(
    pd.read_excel,
    (
        "df_idkmrc_indonli+mnli-translated.xlsx",
        "df_tydiqaid_indonli+mnli-translated.xlsx",
    ),
)

# Keep every row that has a gold answer.
# NOTE(review): no 'is_overlap' filter is applied here, so these frames hold all
# answerable rows - confirm "Overlap" means "overlap rows included", not "overlap rows only".
df_idkmrc_answerable_overlap = (
    df_idkmrc[df_idkmrc['Gold Answer'].notna()].reset_index(drop=True)
)
df_tydiqaid_answerable_overlap = (
    df_tydiqaid[df_tydiqaid['Gold Answer'].notna()].reset_index(drop=True)
)

In [28]:
named_frames = (
    (df_idkmrc_answerable_overlap, "IDK-MRC"),
    (df_tydiqaid_answerable_overlap, "TyDI-QA-ID"),
)

# Gold-label distribution for each dataset, with a 24-character rule in between.
for position, (frame, title) in enumerate(named_frames):
    if position > 0:
        print("=" * 24)
    count_label(frame, title)

print()

# Right/wrong-answer breakdown for each dataset, with a 20-character rule in between.
for position, (frame, title) in enumerate(named_frames):
    if position > 0:
        print("=" * 20)
    count_properties(frame, title)

GOLD IDK-MRC
E: 254 (60.0 %)
N: 120 (28.000000000000004 %)
C: 48 (11.0 %)

Total data: 422
GOLD TYDI-QA-ID
E: 513 (60.0 %)
N: 285 (33.0 %)
C: 58 (7.000000000000001 %)

Total data: 856

IDK-MRC
RE: 178 (67.0) %
RN: 65 (24.0) %
RC: 24 (9.0) %

WE: 70 (45.0) %
WN: 56 (36.0) %
WC: 29 (19.0) %
TYDI-QA-ID
RE: 370 (65.0) %
RN: 167 (28.999999999999996) %
RC: 33 (6.0) %

WE: 145 (51.0) %
WN: 111 (39.0) %
WC: 30 (10.0) %
