In [1]:
import os
import pandas as pd
from src.test_evaluation import *

In [2]:
# Read the children's transcription table for the readingTestFluencE test.
# The path is kept in its own variable so it can be reused or swapped easily.
data_path = 'transcriptions/readingTestFluencE_children.csv'
tests_df = pd.read_csv(filepath_or_buffer=data_path)

In [3]:
# Reference (ground-truth) transcription for readingTestFluencE: the value in
# the 'Phonetic Transcription' column of the row labelled 0.
df = pd.read_csv('transcriptions/readingTestFluencE_transcriptions.csv')
ground_truth = df.at[0, 'Phonetic Transcription']

In [4]:
# Preview the first five rows of the children's transcription table.
tests_df.head(n=5)

Unnamed: 0,File Name,Phonetic Transcription
0,readingTestFluencE_098522E8-2203-425E-85E5-580...,ɑ̃sez istwaʁ də lysdy dyitie dɑ̃ yzjevvɛzɔ̃ si...
1,readingTestFluencE_BE04EB29-C18F-4382-8DB5-4A1...,listwaʁ dœ̃ sjø dœ̃ pødə də məsj pətiki vi dɑ̃...
2,readingTestFluencE_4F8CAF37-C0E2-4A9B-9E5C-F87...,sɛ litwa dy m̃dy mɔ məsø pətikiv pə vjɛ me ity...
3,readingTestFluencE_9620A493-0DAB-432D-A939-A6C...,lfeitɔ dəmsypi de vadɛ̃ fi lz ɑ̃sfi okœʁ dœ̃ s...
4,readingTestFluencE_CD57AFB2-2DA2-4106-935C-9BD...,valakpliʁavoʁi itaʁive ifoiʁ apɔtsidyp puʁviiʁ...


In [5]:
# Evaluate one recording: look up the child's transcription by file name and
# score it against the ground truth with every evaluation method.
target_file = 'readingTestFluencE_75A80925-F8CF-463D-AFED-5CC399848CC2.wav'
matching_rows = tests_df.loc[tests_df['File Name'] == target_file, 'Phonetic Transcription']

# An empty selection would make .iloc[0] fail with the opaque
# "single positional indexer is out-of-bounds"; raise the same exception type
# with a message that says which file is missing.
if matching_rows.empty:
    raise IndexError(f"No row in tests_df with 'File Name' == {target_file!r}")
child_transcription = matching_rows.iloc[0]

# We print the children transcription and the ground truth
print(f"Child transcription: {child_transcription}")
print(f"Ground truth: {ground_truth}")
print("-" * 30)

# run_all_evaluations comes from src.test_evaluation (star import); each item
# it returns is read below through its 'method' and 'score' keys.
results = run_all_evaluations(ground_truth, child_transcription)

for res in results:
    print(f"Method: {res['method']}")
    print(f"Score: {res['score']}")
    print("-" * 30)

Child transcription: sə listwaʁ də məsø pəti ki vi dɑ̃z yn ljɛ mɛzɔ̃ sitile o kœʁ dɑ̃vjø vilaʒ la mɛzɔ̃ e dɑ̃tuʁe dɑ̃ ʒaʁdɛ̃ avɛk yn baʁeil a de k̃tɔ̃bʁ deʃu pʁize tusɔʁt də lik ʁofɔ̃daʁdɛ̃ lə bɔʁtilɔ̃ pʁlɔ̃ ʁɛstuʒuʁ pɛʁmɛ puʁpə jœʁ aʁtysdə seʃapay pys ɛ m səkuʃe pʁɛ də lapubɛ alɔ̃̃bʁ loʁɑ̃ʒe kuvɛʁt fʁide lisy sy a puse kuʁmɑ̃ i kʁoktu sə ki lyi asʃu
Ground truth: sɛ listwaʁ də məsjø pəti ki vi dɑ̃z yn vjɛj mɛzɔ̃ sitye o kœʁ dœ̃ vjø vilaʒ la mɛzɔ̃ ɛt ɑ̃tuʁe dœ̃ ʒaʁdɛ̃ avɛk yn baʁjɛʁ il i a de kɔ̃kɔ̃bʁ de ʃu fʁize tut sɔʁt də leɡymz o fɔ̃ dy ʒaʁdɛ̃ lə pɔʁtijɔ̃ ʁɛst tuʒuʁ fɛʁme puʁ kə ʃjɛ̃ a pys nə seʃap pa ʃjɛ̃ a pysz ɛm sə kuʃe pʁɛ də la pubɛl a lɔ̃bʁ dœ̃n ɔʁɑ̃ʒe kuvɛʁ də fʁyi delisjø ʃjɛ̃ a pysz ɛ ɡuʁmɑ̃ il kʁɔk tu sə ki lyi pas su la dɑ̃ dez ɔʁɑ̃ʒ puʁi ki tɔ̃b syʁ lə sɔl de flœʁ fanez œ̃ mɔʁso də byvaʁ œ̃ ʒuʁ məsjø pəti desid də mɛtʁ ʃjɛ̃ a pys dɑ̃z yn niʃ ʃjɛ̃ a pys nɛm paz ɛtʁ ɑ̃fɛʁme il pʁefɛʁ sɑ̃dɔʁmiʁ ɑ̃ ʁəɡaʁdɑ̃ lez etwal dɑ̃ lə sjɛl tut le nyiz il abwa kɑ̃ məsjø pəti va sə kuʃ

In [6]:
# Sweep the similarity threshold for the same (ground truth, child) pair.
thresholds = [
    0.6,
    0.7,
    0.8,
    0.9,
]

# Each returned item is read below through its 'threshold' and 'score' keys.
results = compare_methods_with_different_thresholds(
    ground_truth,
    child_transcription,
    thresholds,
)

# One line per threshold so the scores can be compared at a glance.
for result in results:
    print(f"Threshold: {result['threshold']} -> Score: {result['score']}")

Threshold: 0.6 -> Score: 7
Threshold: 0.7 -> Score: 2
Threshold: 0.8 -> Score: 2
Threshold: 0.9 -> Score: 2


In [7]:
# Grid of parameters to try: window sizes 3 through 7 and four thresholds.
window_sizes = list(range(3, 8))
thresholds = [
    0.6,
    0.7,
    0.8,
    0.9,
]

# Each returned item is read below through its 'window_size', 'threshold' and
# 'score' keys.
# NOTE(review): the recorded run printed Score 1 for every combination —
# confirm that window_size and threshold are actually applied by
# compare_methods_with_different_parameters.
results = compare_methods_with_different_parameters(
    ground_truth,
    child_transcription,
    window_sizes,
    thresholds,
)

# One line per (window size, threshold) combination.
for result in results:
    print(f"Window Size: {result['window_size']} | Threshold: {result['threshold']} -> Score: {result['score']}")

Window Size: 3 | Threshold: 0.6 -> Score: 1
Window Size: 3 | Threshold: 0.7 -> Score: 1
Window Size: 3 | Threshold: 0.8 -> Score: 1
Window Size: 3 | Threshold: 0.9 -> Score: 1
Window Size: 4 | Threshold: 0.6 -> Score: 1
Window Size: 4 | Threshold: 0.7 -> Score: 1
Window Size: 4 | Threshold: 0.8 -> Score: 1
Window Size: 4 | Threshold: 0.9 -> Score: 1
Window Size: 5 | Threshold: 0.6 -> Score: 1
Window Size: 5 | Threshold: 0.7 -> Score: 1
Window Size: 5 | Threshold: 0.8 -> Score: 1
Window Size: 5 | Threshold: 0.9 -> Score: 1
Window Size: 6 | Threshold: 0.6 -> Score: 1
Window Size: 6 | Threshold: 0.7 -> Score: 1
Window Size: 6 | Threshold: 0.8 -> Score: 1
Window Size: 6 | Threshold: 0.9 -> Score: 1
Window Size: 7 | Threshold: 0.6 -> Score: 1
Window Size: 7 | Threshold: 0.7 -> Score: 1
Window Size: 7 | Threshold: 0.8 -> Score: 1
Window Size: 7 | Threshold: 0.9 -> Score: 1
