# Driver notebook for the full pseudo-transcript, TF-IDF-based subset selection experiment

### Creating pseudo transcripts

In [1]:
import sys
import torch

In [2]:
# Show which Python interpreter the kernel runs on; this same executable is
# what the cells below hand to the scripts they launch.
print(sys.executable)

/home/mayank/.conda/envs/error/bin/python


In [3]:
# Use the GPU when CUDA is available, otherwise fall back to the CPU.
if torch.cuda.is_available():
    device = torch.device("cuda")
else:
    device = torch.device("cpu")
print(device)

cuda


In [4]:
# Root of the repository checkout on the machine this notebook was run on.
BASE_PATH = '/home/mayank/MTP/begin_again/Error-Driven-ASR-Personalization'
# Directory that contains this experiment's folder.
PARENT_DIR = f'{BASE_PATH}/entropy-testing'
# Folder of this experiment; TSS.py, the models and the data paths used below
# are all resolved relative to it.
CURR_DIR = f'{PARENT_DIR}/pseudo-transcript-entropy'

In [5]:
# Speakers covered by the experiment; every entry gets an "_english" suffix.
ACCENTS = [
    f'{speaker}_english'
    for speaker in (
        'assamese_female',
        'gujarati_female',
        'hindi_male',
        'kannada_male',
        'malayalam_male',
        'manipuri_female',
        'rajasthani_male',
        'tamil_male',
    )
]

# Selection budgets; kept as strings since they are only interpolated into
# command-line arguments and directory names below.
BUDGETS = ['100', '200', '400', '800']

# Value(s) forwarded as --target to TSS.py.
TARGET = [10]

# Selection functions forwarded as --fxn to TSS.py.
METHODS = ['FL2MI', 'GCMI', 'LogDMI']

# Value(s) forwarded as --eta to TSS.py.
ETA = ['1.0']

# Similarity measure(s) forwarded as --similarity to TSS.py.
SIM = ['euclidean']

# Feature type(s) forwarded as --feature_type to TSS.py.
FEATURES = ['39']

# Run identifiers used to locate the per-run output directories.
RUNS = ['1', '2', '3']

In [6]:
# Do the SMI generation

def doSMI(feature, similarity, eta, target, budget, method, accent):
    
    python_file = CURR_DIR + "/TSS.py"
    
    print("----------------------- TSS -----------------------")
    print(f"accent_{accent}, budget_{budget}, method_{method}")
    !$sys.executable $python_file --target $target --budget $budget --similarity $similarity --eta $eta --accent $accent --fxn $method --feature_type $feature
    

def generate_SMI_selections():
    """Run doSMI once for every combination of the configured settings.

    The combinations are visited in the same order as a loop nest over
    FEATURES, SIM, ETA, TARGET, BUDGETS, METHODS and ACCENTS would visit
    them: the accent changes fastest and the feature type slowest.
    """
    grid = (
        dict(
            feature=feature,
            similarity=sim,
            eta=eta,
            target=target,
            budget=budget,
            method=method,
            accent=accent,
        )
        for feature in FEATURES
        for sim in SIM
        for eta in ETA
        for target in TARGET
        for budget in BUDGETS
        for method in METHODS
        for accent in ACCENTS
    )
    for settings in grid:
        doSMI(**settings)

# Kick off the full sweep: one TSS.py invocation per configuration combination.
generate_SMI_selections()

----------------------- TSS -----------------------
accent_assamese_female_english, budget_100, method_FL2MI
(50, 39)
(3244, 39)
(3491, 39)
(3267, 39)
(3492, 39)
(5183, 39)
(3169, 39)
(6925, 39)
(5765, 39)
(2513, 39)
34536 in ground, shape=(34536, 39)
10 in query, shape=(10, 39)
2513 in test, shape=(2513, 39)
creating kernels ....
kernel creation done .... in 13.553933143615723s
ground_kernel:  (34536, 34536)
query_kernel:  (34536, 10)
query_query_kernel:  (10, 10)

creating FL2MI object


FL2MI object created


generating greedyList...

[||||||||||||||||||||]100% [Iteration 300 of 300]
.... greedyList generated ... 

subset computed ....
----------------------- TSS -----------------------
accent_gujarati_female_english, budget_100, method_FL2MI
(50, 39)
(3244, 39)
(3491, 39)
(3267, 39)
(3492, 39)
(5183, 39)
(3169, 39)
(6925, 39)
(5765, 39)
(1401, 39)
34536 in ground, shape=(34536, 39)
10 in query, shape=(10, 39)
1401 in test, shape=(1401, 39)
creating kernels ....
kernel creation done

### Generate the transcripts and convert graphemes to phonemes
-  We'll directly reuse the code from error-model here

### Generate the transcripts

In [6]:
def infer_transcripts(feature, similarity, eta, target, budget, method, accent, run):
    python_env = sys.executable
    python_file = CURR_DIR + "/models/quartznet_asr/inference.py"
    data_base_dir = CURR_DIR + f"/data/{accent}/manifests/TSS_output/all/budget_{budget}/target_{target}/{method}/eta_{eta}/{similarity}/{feature}/run_{run}/"
    wav_dir=BASE_PATH + "/data/indicTTS_audio/indicTTS/{accent}/english/wav/"
    ckpt_base_dir=CURR_DIR + "/models/pretrained_checkpoints/"
    batch_size=32
    bash_file = CURR_DIR + "/models/quartznet_asr/scripts/infer_transcriptions_on_seed_set.sh"

    
    print("------ Generating Pseudo Transcripts -------")
    print(f"accent_{accent}, budget_{budget}, method_{method}, run_{run}")
    !export CUDA_VISIBLE_DEVICES=0,1 && bash $bash_file $python_env $python_file $data_base_dir $wav_dir $ckpt_base_dir $batch_size
    
def infer_transcripts_all():
    """Run infer_transcripts for every combination of the configured settings.

    The combinations are visited in the same order as a loop nest over
    FEATURES, SIM, ETA, TARGET, BUDGETS, METHODS, RUNS and ACCENTS would
    visit them: the accent changes fastest, then the run.

    For a quick partial run, temporarily narrow ACCENTS, METHODS or BUDGETS
    before calling this function.
    """
    grid = (
        dict(
            feature=feature,
            similarity=sim,
            eta=eta,
            target=target,
            budget=budget,
            method=method,
            accent=accent,
            run=run,
        )
        for feature in FEATURES
        for sim in SIM
        for eta in ETA
        for target in TARGET
        for budget in BUDGETS
        for method in METHODS
        for run in RUNS
        for accent in ACCENTS
    )
    for settings in grid:
        infer_transcripts(**settings)
    

In [None]:
# Generate pseudo transcripts for every selection in the configured grid.
infer_transcripts_all()

------ Generating Pseudo Transcripts -------
accent_assamese_female_english, budget_100, method_FL2MI, run_1
--------------START---------------
INPUTS  <--------- /home/mayank/MTP/begin_again/Error-Driven-ASR-Personalization/entropy-testing/pseudo-transcript-entropy/data/assamese_female_english/manifests/TSS_output/all/budget_100/target_10/FL2MI/eta_1.0/euclidean/39/run_1/
Outputs ---------> /home/mayank/MTP/begin_again/Error-Driven-ASR-Personalization/entropy-testing/pseudo-transcript-entropy/data/assamese_female_english/manifests/TSS_output/all/budget_100/target_10/FL2MI/eta_1.0/euclidean/39/run_1//quartznet_outputs
100%|█████████████████████████████████████████████| 3/3 [00:11<00:00,  5.54s/it]
--------------DONE---------------
------ Generating Pseudo Transcripts -------
accent_gujarati_female_english, budget_100, method_FL2MI, run_1
--------------START---------------
INPUTS  <--------- /home/mayank/MTP/begin_again/Error-Driven-ASR-Personalization/entropy-testing/pseudo-transcript-

--------------START---------------
INPUTS  <--------- /home/mayank/MTP/begin_again/Error-Driven-ASR-Personalization/entropy-testing/pseudo-transcript-entropy/data/kannada_male_english/manifests/TSS_output/all/budget_100/target_10/FL2MI/eta_1.0/euclidean/39/run_2/
Outputs ---------> /home/mayank/MTP/begin_again/Error-Driven-ASR-Personalization/entropy-testing/pseudo-transcript-entropy/data/kannada_male_english/manifests/TSS_output/all/budget_100/target_10/FL2MI/eta_1.0/euclidean/39/run_2//quartznet_outputs
100%|█████████████████████████████████████████████| 3/3 [00:08<00:00,  3.92s/it]
--------------DONE---------------
------ Generating Pseudo Transcripts -------
accent_malayalam_male_english, budget_100, method_FL2MI, run_2
--------------START---------------
INPUTS  <--------- /home/mayank/MTP/begin_again/Error-Driven-ASR-Personalization/entropy-testing/pseudo-transcript-entropy/data/malayalam_male_english/manifests/TSS_output/all/budget_100/target_10/FL2MI/eta_1.0/euclidean/39/run_2/


100%|█████████████████████████████████████████████| 3/3 [00:09<00:00,  4.57s/it]
--------------DONE---------------
------ Generating Pseudo Transcripts -------
accent_tamil_male_english, budget_100, method_FL2MI, run_3
--------------START---------------
INPUTS  <--------- /home/mayank/MTP/begin_again/Error-Driven-ASR-Personalization/entropy-testing/pseudo-transcript-entropy/data/tamil_male_english/manifests/TSS_output/all/budget_100/target_10/FL2MI/eta_1.0/euclidean/39/run_3/
Outputs ---------> /home/mayank/MTP/begin_again/Error-Driven-ASR-Personalization/entropy-testing/pseudo-transcript-entropy/data/tamil_male_english/manifests/TSS_output/all/budget_100/target_10/FL2MI/eta_1.0/euclidean/39/run_3//quartznet_outputs
100%|█████████████████████████████████████████████| 3/3 [00:08<00:00,  4.23s/it]
--------------DONE---------------
------ Generating Pseudo Transcripts -------
accent_assamese_female_english, budget_100, method_GCMI, run_1
--------------START---------------
INPUTS  <-------

--------------START---------------
INPUTS  <--------- /home/mayank/MTP/begin_again/Error-Driven-ASR-Personalization/entropy-testing/pseudo-transcript-entropy/data/hindi_male_english/manifests/TSS_output/all/budget_100/target_10/GCMI/eta_1.0/euclidean/39/run_2/
Outputs ---------> /home/mayank/MTP/begin_again/Error-Driven-ASR-Personalization/entropy-testing/pseudo-transcript-entropy/data/hindi_male_english/manifests/TSS_output/all/budget_100/target_10/GCMI/eta_1.0/euclidean/39/run_2//quartznet_outputs
100%|█████████████████████████████████████████████| 4/4 [00:08<00:00,  2.05s/it]
--------------DONE---------------
------ Generating Pseudo Transcripts -------
accent_kannada_male_english, budget_100, method_GCMI, run_2
--------------START---------------
INPUTS  <--------- /home/mayank/MTP/begin_again/Error-Driven-ASR-Personalization/entropy-testing/pseudo-transcript-entropy/data/kannada_male_english/manifests/TSS_output/all/budget_100/target_10/GCMI/eta_1.0/euclidean/39/run_2/
Outputs ----

100%|█████████████████████████████████████████████| 4/4 [00:07<00:00,  2.39s/it]
--------------DONE---------------
------ Generating Pseudo Transcripts -------
accent_rajasthani_male_english, budget_100, method_GCMI, run_3
--------------START---------------
INPUTS  <--------- /home/mayank/MTP/begin_again/Error-Driven-ASR-Personalization/entropy-testing/pseudo-transcript-entropy/data/rajasthani_male_english/manifests/TSS_output/all/budget_100/target_10/GCMI/eta_1.0/euclidean/39/run_3/
Outputs ---------> /home/mayank/MTP/begin_again/Error-Driven-ASR-Personalization/entropy-testing/pseudo-transcript-entropy/data/rajasthani_male_english/manifests/TSS_output/all/budget_100/target_10/GCMI/eta_1.0/euclidean/39/run_3//quartznet_outputs
100%|█████████████████████████████████████████████| 3/3 [00:09<00:00,  4.64s/it]
--------------DONE---------------
------ Generating Pseudo Transcripts -------
accent_tamil_male_english, budget_100, method_GCMI, run_3
--------------START---------------
INPUTS  <

100%|█████████████████████████████████████████████| 3/3 [00:08<00:00,  4.23s/it]
--------------DONE---------------
------ Generating Pseudo Transcripts -------
accent_gujarati_female_english, budget_100, method_LogDMI, run_2
--------------START---------------
INPUTS  <--------- /home/mayank/MTP/begin_again/Error-Driven-ASR-Personalization/entropy-testing/pseudo-transcript-entropy/data/gujarati_female_english/manifests/TSS_output/all/budget_100/target_10/LogDMI/eta_1.0/euclidean/39/run_2/
Outputs ---------> /home/mayank/MTP/begin_again/Error-Driven-ASR-Personalization/entropy-testing/pseudo-transcript-entropy/data/gujarati_female_english/manifests/TSS_output/all/budget_100/target_10/LogDMI/eta_1.0/euclidean/39/run_2//quartznet_outputs
100%|█████████████████████████████████████████████| 3/3 [00:11<00:00,  3.73s/it]
--------------DONE---------------
------ Generating Pseudo Transcripts -------
accent_hindi_male_english, budget_100, method_LogDMI, run_2
--------------START---------------
I

100%|█████████████████████████████████████████████| 4/4 [00:07<00:00,  1.93s/it]
--------------DONE---------------
------ Generating Pseudo Transcripts -------
accent_malayalam_male_english, budget_100, method_LogDMI, run_3
--------------START---------------
INPUTS  <--------- /home/mayank/MTP/begin_again/Error-Driven-ASR-Personalization/entropy-testing/pseudo-transcript-entropy/data/malayalam_male_english/manifests/TSS_output/all/budget_100/target_10/LogDMI/eta_1.0/euclidean/39/run_3/
Outputs ---------> /home/mayank/MTP/begin_again/Error-Driven-ASR-Personalization/entropy-testing/pseudo-transcript-entropy/data/malayalam_male_english/manifests/TSS_output/all/budget_100/target_10/LogDMI/eta_1.0/euclidean/39/run_3//quartznet_outputs
100%|█████████████████████████████████████████████| 3/3 [00:09<00:00,  4.38s/it]
--------------DONE---------------
------ Generating Pseudo Transcripts -------
accent_manipuri_female_english, budget_100, method_LogDMI, run_3
--------------START---------------

100%|█████████████████████████████████████████████| 5/5 [00:16<00:00,  4.09s/it]
--------------DONE---------------
------ Generating Pseudo Transcripts -------
accent_tamil_male_english, budget_200, method_FL2MI, run_1
--------------START---------------
INPUTS  <--------- /home/mayank/MTP/begin_again/Error-Driven-ASR-Personalization/entropy-testing/pseudo-transcript-entropy/data/tamil_male_english/manifests/TSS_output/all/budget_200/target_10/FL2MI/eta_1.0/euclidean/39/run_1/
Outputs ---------> /home/mayank/MTP/begin_again/Error-Driven-ASR-Personalization/entropy-testing/pseudo-transcript-entropy/data/tamil_male_english/manifests/TSS_output/all/budget_200/target_10/FL2MI/eta_1.0/euclidean/39/run_1//quartznet_outputs
100%|█████████████████████████████████████████████| 6/6 [00:18<00:00,  3.06s/it]
--------------DONE---------------
------ Generating Pseudo Transcripts -------
accent_assamese_female_english, budget_200, method_FL2MI, run_2
--------------START---------------
INPUTS  <------

------ Generating Pseudo Transcripts -------
accent_hindi_male_english, budget_200, method_FL2MI, run_3
--------------START---------------
INPUTS  <--------- /home/mayank/MTP/begin_again/Error-Driven-ASR-Personalization/entropy-testing/pseudo-transcript-entropy/data/hindi_male_english/manifests/TSS_output/all/budget_200/target_10/FL2MI/eta_1.0/euclidean/39/run_3/
Outputs ---------> /home/mayank/MTP/begin_again/Error-Driven-ASR-Personalization/entropy-testing/pseudo-transcript-entropy/data/hindi_male_english/manifests/TSS_output/all/budget_200/target_10/FL2MI/eta_1.0/euclidean/39/run_3//quartznet_outputs
100%|█████████████████████████████████████████████| 7/7 [00:15<00:00,  2.17s/it]
--------------DONE---------------
------ Generating Pseudo Transcripts -------
accent_kannada_male_english, budget_200, method_FL2MI, run_3
--------------START---------------
INPUTS  <--------- /home/mayank/MTP/begin_again/Error-Driven-ASR-Personalization/entropy-testing/pseudo-transcript-entropy/data/kanna

100%|█████████████████████████████████████████████| 8/8 [00:14<00:00,  1.83s/it]
--------------DONE---------------
------ Generating Pseudo Transcripts -------
accent_rajasthani_male_english, budget_200, method_GCMI, run_1
--------------START---------------
INPUTS  <--------- /home/mayank/MTP/begin_again/Error-Driven-ASR-Personalization/entropy-testing/pseudo-transcript-entropy/data/rajasthani_male_english/manifests/TSS_output/all/budget_200/target_10/GCMI/eta_1.0/euclidean/39/run_1/
Outputs ---------> /home/mayank/MTP/begin_again/Error-Driven-ASR-Personalization/entropy-testing/pseudo-transcript-entropy/data/rajasthani_male_english/manifests/TSS_output/all/budget_200/target_10/GCMI/eta_1.0/euclidean/39/run_1//quartznet_outputs
100%|█████████████████████████████████████████████| 5/5 [00:16<00:00,  4.07s/it]
--------------DONE---------------
------ Generating Pseudo Transcripts -------
accent_tamil_male_english, budget_200, method_GCMI, run_1
--------------START---------------
INPUTS  <

--------------START---------------
INPUTS  <--------- /home/mayank/MTP/begin_again/Error-Driven-ASR-Personalization/entropy-testing/pseudo-transcript-entropy/data/rajasthani_male_english/manifests/TSS_output/all/budget_200/target_10/GCMI/eta_1.0/euclidean/39/run_3/
Outputs ---------> /home/mayank/MTP/begin_again/Error-Driven-ASR-Personalization/entropy-testing/pseudo-transcript-entropy/data/rajasthani_male_english/manifests/TSS_output/all/budget_200/target_10/GCMI/eta_1.0/euclidean/39/run_3//quartznet_outputs
100%|█████████████████████████████████████████████| 5/5 [00:15<00:00,  3.94s/it]
--------------DONE---------------
------ Generating Pseudo Transcripts -------
accent_tamil_male_english, budget_200, method_GCMI, run_3
--------------START---------------
INPUTS  <--------- /home/mayank/MTP/begin_again/Error-Driven-ASR-Personalization/entropy-testing/pseudo-transcript-entropy/data/tamil_male_english/manifests/TSS_output/all/budget_200/target_10/GCMI/eta_1.0/euclidean/39/run_3/
Output

100%|█████████████████████████████████████████████| 5/5 [00:12<00:00,  2.47s/it]
--------------DONE---------------
------ Generating Pseudo Transcripts -------
accent_hindi_male_english, budget_200, method_LogDMI, run_2
--------------START---------------
INPUTS  <--------- /home/mayank/MTP/begin_again/Error-Driven-ASR-Personalization/entropy-testing/pseudo-transcript-entropy/data/hindi_male_english/manifests/TSS_output/all/budget_200/target_10/LogDMI/eta_1.0/euclidean/39/run_2/
Outputs ---------> /home/mayank/MTP/begin_again/Error-Driven-ASR-Personalization/entropy-testing/pseudo-transcript-entropy/data/hindi_male_english/manifests/TSS_output/all/budget_200/target_10/LogDMI/eta_1.0/euclidean/39/run_2//quartznet_outputs
100%|█████████████████████████████████████████████| 8/8 [00:14<00:00,  1.76s/it]
--------------DONE---------------
------ Generating Pseudo Transcripts -------
accent_kannada_male_english, budget_200, method_LogDMI, run_2
--------------START---------------
INPUTS  <-----

100%|█████████████████████████████████████████████| 6/6 [00:15<00:00,  2.83s/it]
--------------DONE---------------
------ Generating Pseudo Transcripts -------
accent_manipuri_female_english, budget_200, method_LogDMI, run_3
--------------START---------------
INPUTS  <--------- /home/mayank/MTP/begin_again/Error-Driven-ASR-Personalization/entropy-testing/pseudo-transcript-entropy/data/manipuri_female_english/manifests/TSS_output/all/budget_200/target_10/LogDMI/eta_1.0/euclidean/39/run_3/
Outputs ---------> /home/mayank/MTP/begin_again/Error-Driven-ASR-Personalization/entropy-testing/pseudo-transcript-entropy/data/manipuri_female_english/manifests/TSS_output/all/budget_200/target_10/LogDMI/eta_1.0/euclidean/39/run_3//quartznet_outputs
100%|█████████████████████████████████████████████| 9/9 [00:12<00:00,  1.01it/s]
--------------DONE---------------
------ Generating Pseudo Transcripts -------
accent_rajasthani_male_english, budget_200, method_LogDMI, run_3
--------------START------------

------ Generating Pseudo Transcripts -------
accent_assamese_female_english, budget_400, method_FL2MI, run_2
--------------START---------------
INPUTS  <--------- /home/mayank/MTP/begin_again/Error-Driven-ASR-Personalization/entropy-testing/pseudo-transcript-entropy/data/assamese_female_english/manifests/TSS_output/all/budget_400/target_10/FL2MI/eta_1.0/euclidean/39/run_2/
Outputs ---------> /home/mayank/MTP/begin_again/Error-Driven-ASR-Personalization/entropy-testing/pseudo-transcript-entropy/data/assamese_female_english/manifests/TSS_output/all/budget_400/target_10/FL2MI/eta_1.0/euclidean/39/run_2//quartznet_outputs
100%|███████████████████████████████████████████| 11/11 [00:24<00:00,  1.69s/it]
--------------DONE---------------
------ Generating Pseudo Transcripts -------
accent_gujarati_female_english, budget_400, method_FL2MI, run_2
--------------START---------------
INPUTS  <--------- /home/mayank/MTP/begin_again/Error-Driven-ASR-Personalization/entropy-testing/pseudo-transcript-

--------------START---------------
INPUTS  <--------- /home/mayank/MTP/begin_again/Error-Driven-ASR-Personalization/entropy-testing/pseudo-transcript-entropy/data/kannada_male_english/manifests/TSS_output/all/budget_400/target_10/FL2MI/eta_1.0/euclidean/39/run_3/
Outputs ---------> /home/mayank/MTP/begin_again/Error-Driven-ASR-Personalization/entropy-testing/pseudo-transcript-entropy/data/kannada_male_english/manifests/TSS_output/all/budget_400/target_10/FL2MI/eta_1.0/euclidean/39/run_3//quartznet_outputs
100%|███████████████████████████████████████████| 12/12 [00:23<00:00,  1.97s/it]
--------------DONE---------------
------ Generating Pseudo Transcripts -------
accent_malayalam_male_english, budget_400, method_FL2MI, run_3
--------------START---------------
INPUTS  <--------- /home/mayank/MTP/begin_again/Error-Driven-ASR-Personalization/entropy-testing/pseudo-transcript-entropy/data/malayalam_male_english/manifests/TSS_output/all/budget_400/target_10/FL2MI/eta_1.0/euclidean/39/run_3/


100%|███████████████████████████████████████████| 10/10 [00:28<00:00,  2.77s/it]
--------------DONE---------------
------ Generating Pseudo Transcripts -------
accent_tamil_male_english, budget_400, method_GCMI, run_1
--------------START---------------
INPUTS  <--------- /home/mayank/MTP/begin_again/Error-Driven-ASR-Personalization/entropy-testing/pseudo-transcript-entropy/data/tamil_male_english/manifests/TSS_output/all/budget_400/target_10/GCMI/eta_1.0/euclidean/39/run_1/
Outputs ---------> /home/mayank/MTP/begin_again/Error-Driven-ASR-Personalization/entropy-testing/pseudo-transcript-entropy/data/tamil_male_english/manifests/TSS_output/all/budget_400/target_10/GCMI/eta_1.0/euclidean/39/run_1//quartznet_outputs
100%|███████████████████████████████████████████| 11/11 [00:27<00:00,  2.00s/it]
--------------DONE---------------
------ Generating Pseudo Transcripts -------
accent_assamese_female_english, budget_400, method_GCMI, run_2
--------------START---------------
INPUTS  <--------- 

--------------START---------------
INPUTS  <--------- /home/mayank/MTP/begin_again/Error-Driven-ASR-Personalization/entropy-testing/pseudo-transcript-entropy/data/hindi_male_english/manifests/TSS_output/all/budget_400/target_10/GCMI/eta_1.0/euclidean/39/run_3/
Outputs ---------> /home/mayank/MTP/begin_again/Error-Driven-ASR-Personalization/entropy-testing/pseudo-transcript-entropy/data/hindi_male_english/manifests/TSS_output/all/budget_400/target_10/GCMI/eta_1.0/euclidean/39/run_3//quartznet_outputs
100%|███████████████████████████████████████████| 13/13 [00:25<00:00,  1.92s/it]
--------------DONE---------------
------ Generating Pseudo Transcripts -------
accent_kannada_male_english, budget_400, method_GCMI, run_3
--------------START---------------
INPUTS  <--------- /home/mayank/MTP/begin_again/Error-Driven-ASR-Personalization/entropy-testing/pseudo-transcript-entropy/data/kannada_male_english/manifests/TSS_output/all/budget_400/target_10/GCMI/eta_1.0/euclidean/39/run_3/
Outputs ----

100%|███████████████████████████████████████████| 13/13 [00:23<00:00,  1.05s/it]
--------------DONE---------------
------ Generating Pseudo Transcripts -------
accent_gujarati_female_english, budget_400, method_LogDMI, run_2
--------------START---------------
INPUTS  <--------- /home/mayank/MTP/begin_again/Error-Driven-ASR-Personalization/entropy-testing/pseudo-transcript-entropy/data/gujarati_female_english/manifests/TSS_output/all/budget_400/target_10/LogDMI/eta_1.0/euclidean/39/run_2/
Outputs ---------> /home/mayank/MTP/begin_again/Error-Driven-ASR-Personalization/entropy-testing/pseudo-transcript-entropy/data/gujarati_female_english/manifests/TSS_output/all/budget_400/target_10/LogDMI/eta_1.0/euclidean/39/run_2//quartznet_outputs
100%|█████████████████████████████████████████████| 9/9 [00:22<00:00,  1.67s/it]
--------------DONE---------------
------ Generating Pseudo Transcripts -------
accent_hindi_male_english, budget_400, method_LogDMI, run_2
--------------START---------------
I

100%|███████████████████████████████████████████| 14/14 [00:25<00:00,  1.83s/it]
--------------DONE---------------
------ Generating Pseudo Transcripts -------
accent_malayalam_male_english, budget_400, method_LogDMI, run_3
--------------START---------------
INPUTS  <--------- /home/mayank/MTP/begin_again/Error-Driven-ASR-Personalization/entropy-testing/pseudo-transcript-entropy/data/malayalam_male_english/manifests/TSS_output/all/budget_400/target_10/LogDMI/eta_1.0/euclidean/39/run_3/
Outputs ---------> /home/mayank/MTP/begin_again/Error-Driven-ASR-Personalization/entropy-testing/pseudo-transcript-entropy/data/malayalam_male_english/manifests/TSS_output/all/budget_400/target_10/LogDMI/eta_1.0/euclidean/39/run_3//quartznet_outputs
100%|███████████████████████████████████████████| 12/12 [00:24<00:00,  2.01s/it]
--------------DONE---------------
------ Generating Pseudo Transcripts -------
accent_manipuri_female_english, budget_400, method_LogDMI, run_3
--------------START---------------

100%|███████████████████████████████████████████| 21/21 [00:45<00:00,  2.18s/it]
--------------DONE---------------
------ Generating Pseudo Transcripts -------
accent_tamil_male_english, budget_800, method_FL2MI, run_1
--------------START---------------
INPUTS  <--------- /home/mayank/MTP/begin_again/Error-Driven-ASR-Personalization/entropy-testing/pseudo-transcript-entropy/data/tamil_male_english/manifests/TSS_output/all/budget_800/target_10/FL2MI/eta_1.0/euclidean/39/run_1/
Outputs ---------> /home/mayank/MTP/begin_again/Error-Driven-ASR-Personalization/entropy-testing/pseudo-transcript-entropy/data/tamil_male_english/manifests/TSS_output/all/budget_800/target_10/FL2MI/eta_1.0/euclidean/39/run_1//quartznet_outputs
100%|███████████████████████████████████████████| 22/22 [00:48<00:00,  1.97s/it]
--------------DONE---------------
------ Generating Pseudo Transcripts -------
accent_assamese_female_english, budget_800, method_FL2MI, run_2
--------------START---------------
INPUTS  <------

100%|███████████████████████████████████████████| 23/23 [00:45<00:00,  1.27s/it]
--------------DONE---------------
------ Generating Pseudo Transcripts -------
accent_malayalam_male_english, budget_800, method_FL2MI, run_3
--------------START---------------
INPUTS  <--------- /home/mayank/MTP/begin_again/Error-Driven-ASR-Personalization/entropy-testing/pseudo-transcript-entropy/data/malayalam_male_english/manifests/TSS_output/all/budget_800/target_10/FL2MI/eta_1.0/euclidean/39/run_3/
Outputs ---------> /home/mayank/MTP/begin_again/Error-Driven-ASR-Personalization/entropy-testing/pseudo-transcript-entropy/data/malayalam_male_english/manifests/TSS_output/all/budget_800/target_10/FL2MI/eta_1.0/euclidean/39/run_3//quartznet_outputs
100%|███████████████████████████████████████████| 22/22 [00:48<00:00,  2.18s/it]
--------------DONE---------------
------ Generating Pseudo Transcripts -------
accent_manipuri_female_english, budget_800, method_FL2MI, run_3
--------------START---------------
INP

------ Generating Pseudo Transcripts -------
accent_tamil_male_english, budget_800, method_GCMI, run_1
--------------START---------------
INPUTS  <--------- /home/mayank/MTP/begin_again/Error-Driven-ASR-Personalization/entropy-testing/pseudo-transcript-entropy/data/tamil_male_english/manifests/TSS_output/all/budget_800/target_10/GCMI/eta_1.0/euclidean/39/run_1/
Outputs ---------> /home/mayank/MTP/begin_again/Error-Driven-ASR-Personalization/entropy-testing/pseudo-transcript-entropy/data/tamil_male_english/manifests/TSS_output/all/budget_800/target_10/GCMI/eta_1.0/euclidean/39/run_1//quartznet_outputs
100%|███████████████████████████████████████████| 22/22 [00:49<00:00,  2.29s/it]
--------------DONE---------------
------ Generating Pseudo Transcripts -------
accent_assamese_female_english, budget_800, method_GCMI, run_2
--------------START---------------
INPUTS  <--------- /home/mayank/MTP/begin_again/Error-Driven-ASR-Personalization/entropy-testing/pseudo-transcript-entropy/data/assame

#### Get the phoneme versions

#### Compute the TF-IDF vectors

#### Make selections using some submodlib utility