In [1]:
import os
import pandas as pd
import numpy as np
from google.cloud import speech_v1
from google.cloud.speech_v1 import enums
from google.datalab import storage
from tqdm import tqdm
from multiprocessing import Pool

In [2]:
# Leftover sanity check: prints a fixed string and defines no state.
print("Hello")

Hello


In [3]:
#CONSTANTS
# CSV manifest stored in Cloud Storage; loaded with pd.read_csv further down.
MANIFEST_PATH = 'gs://aave-test-bucket/DCB_manifest.csv'
# Object-key prefix used to pick the audio files out of the bucket listing.
WAV_FOLDER = 'data_processed_DCB/wav'
# Relative path of the final joined table written by result.to_csv.
OUTPUT_PATH = 'DCB_manifest_transcribed.csv'

In [4]:
# Point the Google client libraries at a service-account key file. The path is
# relative, so it is resolved against the kernel's working directory, and any
# value already present in the environment is overwritten.
# NOTE(review): keep the key file itself out of version control.
os.environ["GOOGLE_APPLICATION_CREDENTIALS"]="speech-rec-key.json"

In [5]:
# Single source of truth for the bucket, so the URI root and the listing
# below cannot drift apart.
BUCKET_NAME = 'aave-test-bucket'
root = "gs://" + BUCKET_NAME

# Keep only WAV objects that live directly under the WAV_FOLDER prefix.
# Matching on "<folder>/" (rather than the bare folder name) skips sibling
# prefixes that merely start with the same text, and the extension check
# skips folder placeholder objects and any non-audio files.
wav_prefix = WAV_FOLDER.rstrip("/") + "/"
audio_files = [
    o.key
    for o in storage.Bucket(BUCKET_NAME).objects()
    if o.key.startswith(wav_prefix) and o.key.lower().endswith(".wav")
]

# Manifest with one row per audio file (wav_file, groundtruth_text, ...).
manifest = pd.read_csv(MANIFEST_PATH)

In [6]:
# Number of object keys collected from the bucket listing.
print(len(audio_files))

4361


In [7]:
# Preview the first rows of the manifest to check its columns.
manifest.head()

Unnamed: 0,wav_file,txt_file,groundtruth_text,duration,age,gender
0,data_processed_DCB/wav/DCB_se1_ag1_m_01_1_part...,data_processed_DCB/txt/DCB_se1_ag1_m_01_1_part...,"Uh, I want to- I'm going to pursue IT. And I'm...",13.18,18,Male
1,data_processed_DCB/wav/DCB_se1_ag1_m_01_1_part...,data_processed_DCB/txt/DCB_se1_ag1_m_01_1_part...,showing that all young black men shouldn't go ...,21.988,18,Male
2,data_processed_DCB/wav/DCB_se1_ag1_m_01_1_part...,data_processed_DCB/txt/DCB_se1_ag1_m_01_1_part...,[And one-] And once you in college we will try...,5.134,18,Male
3,data_processed_DCB/wav/DCB_se1_ag1_m_01_1_part...,data_processed_DCB/txt/DCB_se1_ag1_m_01_1_part...,"Uh, well, basically as of today, Congress Heig...",30.588,18,Male
4,data_processed_DCB/wav/DCB_se1_ag1_m_01_1_part...,data_processed_DCB/txt/DCB_se1_ag1_m_01_1_part...,"Uh, I had /began before the street life/ for- ...",28.943,18,Male


In [8]:
def get_single_transcript(storage_uri):
    """
    Transcribe one audio file from Cloud Storage using asynchronous
    (long-running) speech recognition.

    A new SpeechClient is created on every call.

    Args:
      storage_uri: URI for audio file in Cloud Storage, e.g. gs://[BUCKET]/[FILE]

    Returns:
      The most probable transcript of every recognized segment, stripped and
      joined with single spaces ("" when nothing was recognized), or np.nan
      when the request or the parsing of its response fails.
    """

    client = speech_v1.SpeechClient()

    # Only the language of the supplied audio is specified in the request.
    config = {"language_code": "en-US"}
    audio = {"uri": storage_uri}

    try:
        operation = client.long_running_recognize(config, audio)

        # Blocks until the long-running operation has finished.
        response = operation.result()

        transcript = [
            # First alternative is the most probable result
            result.alternatives[0].transcript.strip()
            for result in response.results
            # A result without alternatives has no text; skip it instead of
            # losing the whole file to an IndexError.
            if result.alternatives
        ]
        return " ".join(transcript)
    except Exception as exc:
        # Best effort: report the failing file together with the real cause
        # and carry on. KeyboardInterrupt/SystemExit are deliberately not
        # caught so a long run can still be interrupted.
        print("TRANSCRIPTION FAILED: {} ({!r})".format(storage_uri, exc))
        return np.nan
        

In [9]:
# Module-level client used by get_single_transcript_multithreaded below, so the
# function does not build a new client for every file.
# NOTE(review): the client is created before the worker Pool is started; with a
# fork-based start method each worker would inherit this object - confirm the
# client tolerates being used after a fork.
client = speech_v1.SpeechClient()

def get_single_transcript_multithreaded(audio_file):
    """
    Transcribe one audio file from Cloud Storage using asynchronous
    (long-running) speech recognition, reusing the module-level `client`.

    The file name is returned together with the transcript so the caller can
    match results that arrive out of order.

    Args:
      audio_file: object key of the audio file, relative to the module-level
        `root` (e.g. gs://[BUCKET]).

    Returns:
      Tuple (audio_file, transcript). The transcript is the most probable
      alternative of every recognized segment, stripped and joined with single
      spaces ("" when nothing was recognized), or np.nan when the request or
      the parsing of its response fails.
    """

    # Build the gs:// URI with plain string operations: os.path.join uses the
    # separator of the local OS and discards `root` when the key starts with "/".
    storage_uri = root.rstrip("/") + "/" + audio_file.lstrip("/")

    # Only the language of the supplied audio is specified in the request.
    config = {"language_code": "en-US"}
    audio = {"uri": storage_uri}

    try:
        operation = client.long_running_recognize(config, audio)

        # Blocks until the long-running operation has finished.
        response = operation.result()

        transcript = [
            # First alternative is the most probable result
            result.alternatives[0].transcript.strip()
            for result in response.results
            # A result without alternatives has no text; skip it instead of
            # losing the whole file to an IndexError.
            if result.alternatives
        ]
        return audio_file, " ".join(transcript)
    except Exception as exc:
        # Best effort: name the failing file and the real cause in a single
        # print call, then carry on. KeyboardInterrupt/SystemExit are
        # deliberately not caught.
        print("TRANSCRIPTION FAILED: {} ({!r})".format(storage_uri, exc))
        return audio_file, np.nan
        

In [11]:
#single process version
# Smoke test on the first `num` files only; results are printed, not stored.
num = 10#len(audio_files)
# Slicing (instead of indexing range(num)) keeps this working when fewer than
# `num` files were listed.
for audio_file in tqdm(audio_files[:num]):
    # gs:// URIs always use "/", independent of the local OS separator.
    full_file_path = root.rstrip("/") + "/" + audio_file.lstrip("/")
    transcript = get_single_transcript(full_file_path)
    print(audio_file)
    print(transcript)

  0%|          | 0/10 [00:00<?, ?it/s]

iter


 10%|█         | 1/10 [00:04<00:44,  4.91s/it]

data_processed_DCB/wav/DCB_se1_ag1_m_01_1_part_1.wav
I want it going to pursue it nonprofit program call big bro
iter


 20%|██        | 2/10 [00:07<00:32,  4.11s/it]

data_processed_DCB/wav/DCB_se1_ag1_m_01_1_part_10.wav
I just want to do everything
iter


 30%|███       | 3/10 [00:10<00:27,  3.88s/it]

data_processed_DCB/wav/DCB_se1_ag1_m_01_1_part_100.wav
ugly one message for people made
iter


 40%|████      | 4/10 [00:16<00:26,  4.45s/it]

data_processed_DCB/wav/DCB_se1_ag1_m_01_1_part_101.wav
find something that you like by something is different from everybody else it is a Trends easy to set but your life is not the easiest
iter


 50%|█████     | 5/10 [00:22<00:24,  4.83s/it]

data_processed_DCB/wav/DCB_se1_ag1_m_01_1_part_11.wav
in the school I was going I was in the computer science class so I learn how to do coding Emily got me interested
iter


 60%|██████    | 6/10 [00:26<00:19,  4.77s/it]

data_processed_DCB/wav/DCB_se1_ag1_m_01_1_part_12.wav
because my family's most be spread out to deceased
iter


 70%|███████   | 7/10 [00:33<00:16,  5.49s/it]

data_processed_DCB/wav/DCB_se1_ag1_m_01_1_part_13.wav
is different but still the same Wisconsin environment different the way it looks different but in general still the same but you still have to watch over your shoulder at the people you grew up with you still got to be careful with your friends is like this is a cycle
iter


 80%|████████  | 8/10 [01:00<00:23, 11.95s/it]

data_processed_DCB/wav/DCB_se1_ag1_m_01_1_part_14.wav
if you go out with somebody and y'all get into it or if you more successful than we have to watch out maybe they might be trying to rob you with a probably try to kill you and stuff like that like I don't think that's likely going to break everybody want the same goal but nobody was trying to reach
iter


 90%|█████████ | 9/10 [01:12<00:11, 11.96s/it]

data_processed_DCB/wav/DCB_se1_ag1_m_01_1_part_15.wav
I guess Parkland is beefing with a hood that's literally right down the street 22nd it's literally has the Boys & Girls Club in these row houses townhouses other than that it's basically nothing to separate
iter


100%|██████████| 10/10 [01:23<00:00,  8.30s/it]

data_processed_DCB/wav/DCB_se1_ag1_m_01_1_part_16.wav
is Ali you can get junk it is shot at 4 you get if you get robbed if there's a lot of stuff, I got her people that kidnapped just Allah





In [13]:
%%time
num_audio_files = len(audio_files)
transcript_dict = {'audio_file':[], 'google_transcription': []}
with Pool(20) as p:
    with tqdm(total=num_audio_files) as prog_bar:
        for i, result in enumerate(tqdm(p.imap_unordered(get_single_transcript_multithreaded, audio_files))):
            prog_bar.update()
            transcript_dict['audio_file'].append(result[0])
            transcript_dict['google_transcription'].append(result[1])

  0%|          | 0/4361 [00:00<?, ?it/s]
  0%|          | 1/4361 [00:03<3:52:54,  3.21s/it]
  0%|          | 3/4361 [00:04<3:01:35,  2.50s/it]
  0%|          | 4/4361 [00:05<2:10:33,  1.80s/it]
  0%|          | 5/4361 [00:05<1:48:29,  1.49s/it]
  0%|          | 7/4361 [00:06<1:20:47,  1.11s/it]
  0%|          | 8/4361 [00:07<1:28:12,  1.22s/it]
  0%|          | 9/4361 [00:08<1:08:48,  1.05it/s]
  0%|          | 10/4361 [00:08<52:30,  1.38it/s] 
  0%|          | 11/4361 [00:08<44:57,  1.61it/s]
  0%|          | 12/4361 [00:08<37:00,  1.96it/s]
  0%|          | 14/4361 [00:09<32:34,  2.22it/s]
  0%|          | 15/4361 [00:09<27:57,  2.59it/s]
  0%|          | 17/4361 [00:10<24:59,  2.90it/s]
  0%|          | 18/4361 [00:10<26:53,  2.69it/s]
  0%|          | 19/4361 [00:12<1:04:06,  1.13it/s]
  0%|          | 20/4361 [00:13<51:28,  1.41it/s]  
  1%|          | 22/4361 [00:13<39:47,  1.82it/s]
  1%|          | 23/4361 [00:13<39:43,  1.82it/s]
  1%|          | 25/4361 [00:14<32:39,  2.21it/

  5%|▍         | 197/4361 [01:27<23:37,  2.94it/s]
  5%|▍         | 198/4361 [01:28<36:37,  1.89it/s]
  5%|▍         | 199/4361 [01:28<28:35,  2.43it/s]
  5%|▍         | 200/4361 [01:28<28:44,  2.41it/s]
  5%|▍         | 201/4361 [01:29<38:32,  1.80it/s]
  5%|▍         | 202/4361 [01:30<33:49,  2.05it/s]
  5%|▍         | 204/4361 [01:30<31:21,  2.21it/s]
  5%|▍         | 206/4361 [01:31<32:16,  2.15it/s]
  5%|▍         | 207/4361 [01:32<25:51,  2.68it/s]
  5%|▍         | 208/4361 [01:32<24:02,  2.88it/s]
  5%|▍         | 210/4361 [01:32<22:06,  3.13it/s]
  5%|▍         | 211/4361 [01:32<17:57,  3.85it/s]
  5%|▍         | 212/4361 [01:33<24:24,  2.83it/s]
  5%|▍         | 213/4361 [01:33<19:40,  3.51it/s]
  5%|▍         | 214/4361 [01:34<27:56,  2.47it/s]
  5%|▍         | 215/4361 [01:34<22:41,  3.04it/s]
  5%|▍         | 216/4361 [01:34<20:18,  3.40it/s]
  5%|▍         | 217/4361 [01:35<21:44,  3.18it/s]
  5%|▍         | 218/4361 [01:35<17:40,  3.91it/s]
  5%|▌         | 219/4361 [01:3

  9%|▉         | 393/4361 [03:03<43:37,  1.52it/s]
  9%|▉         | 394/4361 [03:03<32:50,  2.01it/s]
  9%|▉         | 396/4361 [03:03<29:17,  2.26it/s]
  9%|▉         | 397/4361 [03:05<47:46,  1.38it/s]
  9%|▉         | 398/4361 [03:05<36:23,  1.81it/s]
  9%|▉         | 399/4361 [03:06<47:15,  1.40it/s]
  9%|▉         | 401/4361 [03:07<42:58,  1.54it/s]
  9%|▉         | 402/4361 [03:08<57:59,  1.14it/s]
  9%|▉         | 403/4361 [03:10<1:11:01,  1.08s/it]
  9%|▉         | 404/4361 [03:11<1:14:26,  1.13s/it]
  9%|▉         | 405/4361 [03:12<1:16:20,  1.16s/it]
  9%|▉         | 407/4361 [03:13<59:35,  1.11it/s]  
  9%|▉         | 408/4361 [03:13<46:23,  1.42it/s]
  9%|▉         | 410/4361 [03:14<41:37,  1.58it/s]
  9%|▉         | 411/4361 [03:15<42:22,  1.55it/s]
  9%|▉         | 413/4361 [03:16<37:26,  1.76it/s]
 10%|▉         | 415/4361 [03:16<31:02,  2.12it/s]
 10%|▉         | 416/4361 [03:17<38:49,  1.69it/s]
 10%|▉         | 417/4361 [03:17<31:21,  2.10it/s]
 10%|▉         | 418/43

 14%|█▎        | 598/4361 [04:37<13:27,  4.66it/s]
 14%|█▎        | 599/4361 [04:38<25:21,  2.47it/s]
 14%|█▍        | 600/4361 [04:39<39:18,  1.59it/s]
 14%|█▍        | 601/4361 [04:39<29:32,  2.12it/s]
 14%|█▍        | 602/4361 [04:40<31:56,  1.96it/s]
 14%|█▍        | 605/4361 [04:40<24:34,  2.55it/s]
 14%|█▍        | 607/4361 [04:41<21:49,  2.87it/s]
 14%|█▍        | 608/4361 [04:41<17:09,  3.65it/s]
 14%|█▍        | 609/4361 [04:41<17:26,  3.59it/s]
 14%|█▍        | 610/4361 [04:42<20:27,  3.06it/s]
 14%|█▍        | 612/4361 [04:42<16:06,  3.88it/s]
 14%|█▍        | 613/4361 [04:43<26:54,  2.32it/s]
 14%|█▍        | 614/4361 [04:43<22:47,  2.74it/s]
 14%|█▍        | 615/4361 [04:43<19:04,  3.27it/s]
 14%|█▍        | 617/4361 [04:43<14:32,  4.29it/s]
 14%|█▍        | 618/4361 [04:43<12:51,  4.85it/s]
 14%|█▍        | 619/4361 [04:43<11:30,  5.42it/s]
 14%|█▍        | 620/4361 [04:43<10:11,  6.12it/s]
 14%|█▍        | 621/4361 [04:44<09:53,  6.30it/s]
 14%|█▍        | 622/4361 [04:4

 18%|█▊        | 787/4361 [07:02<26:46,  2.22it/s]
 18%|█▊        | 788/4361 [07:03<32:09,  1.85it/s]
 18%|█▊        | 789/4361 [07:03<30:44,  1.94it/s]
 18%|█▊        | 790/4361 [07:04<31:02,  1.92it/s]
 18%|█▊        | 792/4361 [07:04<23:25,  2.54it/s]
 18%|█▊        | 793/4361 [07:04<19:35,  3.04it/s]
 18%|█▊        | 794/4361 [07:05<25:16,  2.35it/s]
 18%|█▊        | 795/4361 [07:05<19:34,  3.04it/s]
 18%|█▊        | 797/4361 [07:06<20:34,  2.89it/s]
 18%|█▊        | 798/4361 [07:06<31:46,  1.87it/s]
 18%|█▊        | 799/4361 [07:08<50:31,  1.18it/s]
 18%|█▊        | 800/4361 [07:08<41:20,  1.44it/s]
 18%|█▊        | 801/4361 [07:09<31:03,  1.91it/s]
 18%|█▊        | 802/4361 [07:09<31:09,  1.90it/s]
 18%|█▊        | 805/4361 [07:09<22:47,  2.60it/s]
 18%|█▊        | 806/4361 [07:10<30:11,  1.96it/s]
 19%|█▊        | 808/4361 [07:10<24:49,  2.39it/s]
 19%|█▊        | 809/4361 [07:11<30:03,  1.97it/s]
 19%|█▊        | 810/4361 [07:12<44:37,  1.33it/s]
 19%|█▊        | 812/4361 [07:1

 23%|██▎       | 988/4361 [08:27<26:01,  2.16it/s]
 23%|██▎       | 989/4361 [08:27<20:11,  2.78it/s]
 23%|██▎       | 990/4361 [08:27<20:39,  2.72it/s]
 23%|██▎       | 992/4361 [08:28<17:09,  3.27it/s]
 23%|██▎       | 994/4361 [08:29<22:21,  2.51it/s]
 23%|██▎       | 995/4361 [08:29<21:58,  2.55it/s]
 23%|██▎       | 996/4361 [08:30<25:46,  2.18it/s]
 23%|██▎       | 997/4361 [08:30<26:40,  2.10it/s]
 23%|██▎       | 998/4361 [08:31<35:33,  1.58it/s]
 23%|██▎       | 999/4361 [08:32<33:10,  1.69it/s]
 23%|██▎       | 1000/4361 [08:32<30:35,  1.83it/s]
 23%|██▎       | 1001/4361 [08:32<24:50,  2.25it/s]
 23%|██▎       | 1002/4361 [08:33<23:38,  2.37it/s]
 23%|██▎       | 1003/4361 [08:33<23:22,  2.39it/s]
 23%|██▎       | 1004/4361 [08:34<29:27,  1.90it/s]
 23%|██▎       | 1005/4361 [08:34<25:46,  2.17it/s]
 23%|██▎       | 1007/4361 [08:35<21:13,  2.63it/s]
 23%|██▎       | 1008/4361 [08:35<16:57,  3.30it/s]
 23%|██▎       | 1009/4361 [08:36<26:27,  2.11it/s]
 23%|██▎       | 1011/

 27%|██▋       | 1171/4361 [10:06<1:03:49,  1.20s/it]
 27%|██▋       | 1172/4361 [10:07<56:14,  1.06s/it]  
 27%|██▋       | 1173/4361 [10:07<44:14,  1.20it/s]
 27%|██▋       | 1174/4361 [10:08<40:16,  1.32it/s]
 27%|██▋       | 1176/4361 [10:09<37:30,  1.41it/s]
 27%|██▋       | 1177/4361 [10:09<31:53,  1.66it/s]
 27%|██▋       | 1178/4361 [10:10<26:49,  1.98it/s]
 27%|██▋       | 1179/4361 [10:10<33:35,  1.58it/s]
 27%|██▋       | 1180/4361 [10:11<29:44,  1.78it/s]
 27%|██▋       | 1181/4361 [10:13<48:21,  1.10it/s]
 27%|██▋       | 1182/4361 [10:13<42:30,  1.25it/s]
 27%|██▋       | 1183/4361 [10:13<32:26,  1.63it/s]
 27%|██▋       | 1184/4361 [10:15<42:30,  1.25it/s]
 27%|██▋       | 1185/4361 [10:15<38:15,  1.38it/s]
 27%|██▋       | 1187/4361 [10:20<1:07:23,  1.27s/it]
 27%|██▋       | 1188/4361 [10:22<1:18:12,  1.48s/it]
 27%|██▋       | 1189/4361 [10:24<1:18:16,  1.48s/it]
 27%|██▋       | 1190/4361 [10:24<1:00:27,  1.14s/it]
 27%|██▋       | 1191/4361 [10:24<44:34,  1.19it/s] 

 31%|███       | 1356/4361 [12:10<18:59,  2.64it/s]
 31%|███       | 1357/4361 [12:11<18:31,  2.70it/s]
 31%|███       | 1358/4361 [12:11<18:36,  2.69it/s]
 31%|███       | 1359/4361 [12:12<36:18,  1.38it/s]
 31%|███       | 1360/4361 [12:13<27:52,  1.79it/s]
 31%|███       | 1361/4361 [12:13<24:55,  2.01it/s]
 31%|███       | 1362/4361 [12:13<19:53,  2.51it/s]
 31%|███▏      | 1364/4361 [12:13<15:03,  3.32it/s]
 31%|███▏      | 1365/4361 [12:14<15:23,  3.24it/s]
 31%|███▏      | 1366/4361 [12:14<18:04,  2.76it/s]
 31%|███▏      | 1367/4361 [12:15<26:06,  1.91it/s]
 31%|███▏      | 1368/4361 [12:16<28:25,  1.76it/s]
 31%|███▏      | 1370/4361 [12:16<23:56,  2.08it/s]
 31%|███▏      | 1371/4361 [12:17<25:05,  1.99it/s]
 31%|███▏      | 1372/4361 [12:17<24:14,  2.06it/s]
 31%|███▏      | 1373/4361 [12:18<31:28,  1.58it/s]
 32%|███▏      | 1375/4361 [12:19<28:09,  1.77it/s]
 32%|███▏      | 1376/4361 [12:20<27:19,  1.82it/s]
 32%|███▏      | 1377/4361 [12:20<25:32,  1.95it/s]
 32%|███▏   

 35%|███▌      | 1533/4361 [15:01<26:58,  1.75it/s]
 35%|███▌      | 1534/4361 [15:01<25:34,  1.84it/s]
 35%|███▌      | 1535/4361 [15:01<20:12,  2.33it/s]
 35%|███▌      | 1536/4361 [15:02<21:16,  2.21it/s]
 35%|███▌      | 1537/4361 [15:03<28:20,  1.66it/s]
 35%|███▌      | 1538/4361 [15:03<27:37,  1.70it/s]
 35%|███▌      | 1539/4361 [15:04<24:43,  1.90it/s]
 35%|███▌      | 1540/4361 [15:04<19:23,  2.42it/s]
 35%|███▌      | 1541/4361 [15:04<17:45,  2.65it/s]
 35%|███▌      | 1542/4361 [15:05<17:46,  2.64it/s]
 35%|███▌      | 1543/4361 [15:05<14:59,  3.13it/s]
 35%|███▌      | 1544/4361 [15:05<16:28,  2.85it/s]
 35%|███▌      | 1545/4361 [15:06<19:43,  2.38it/s]
 35%|███▌      | 1546/4361 [15:07<28:53,  1.62it/s]
 35%|███▌      | 1547/4361 [15:07<25:00,  1.87it/s]
 35%|███▌      | 1548/4361 [15:08<22:34,  2.08it/s]
 36%|███▌      | 1549/4361 [15:08<17:39,  2.65it/s]
 36%|███▌      | 1550/4361 [15:09<22:58,  2.04it/s]
 36%|███▌      | 1551/4361 [15:09<23:53,  1.96it/s]
 36%|███▌   

 40%|███▉      | 1729/4361 [16:19<23:41,  1.85it/s]
 40%|███▉      | 1730/4361 [16:19<18:59,  2.31it/s]
 40%|███▉      | 1731/4361 [16:19<17:22,  2.52it/s]
 40%|███▉      | 1732/4361 [16:19<16:24,  2.67it/s]
 40%|███▉      | 1733/4361 [16:20<25:06,  1.74it/s]
 40%|███▉      | 1734/4361 [16:21<21:41,  2.02it/s]
 40%|███▉      | 1735/4361 [16:21<17:21,  2.52it/s]
 40%|███▉      | 1736/4361 [16:22<20:47,  2.10it/s]
 40%|███▉      | 1738/4361 [16:22<16:31,  2.65it/s]
 40%|███▉      | 1740/4361 [16:24<22:34,  1.94it/s]
 40%|███▉      | 1741/4361 [16:24<17:45,  2.46it/s]
 40%|███▉      | 1742/4361 [16:24<15:07,  2.89it/s]
 40%|███▉      | 1743/4361 [16:24<14:46,  2.95it/s]
 40%|████      | 1745/4361 [16:24<11:04,  3.94it/s]
 40%|████      | 1747/4361 [16:25<09:13,  4.72it/s]
 40%|████      | 1748/4361 [16:25<16:27,  2.65it/s]
 40%|████      | 1749/4361 [16:26<20:31,  2.12it/s]
 40%|████      | 1750/4361 [16:27<22:03,  1.97it/s]
 40%|████      | 1752/4361 [16:28<22:46,  1.91it/s]
 40%|████   

 44%|████▍     | 1934/4361 [17:42<36:56,  1.09it/s]
 44%|████▍     | 1935/4361 [17:42<31:11,  1.30it/s]
 44%|████▍     | 1936/4361 [17:43<25:52,  1.56it/s]
 44%|████▍     | 1937/4361 [17:43<25:59,  1.55it/s]
 44%|████▍     | 1938/4361 [17:44<22:43,  1.78it/s]
 44%|████▍     | 1939/4361 [17:44<24:28,  1.65it/s]
 45%|████▍     | 1942/4361 [17:45<18:06,  2.23it/s]
 45%|████▍     | 1943/4361 [17:45<20:46,  1.94it/s]
 45%|████▍     | 1944/4361 [17:45<16:26,  2.45it/s]
 45%|████▍     | 1946/4361 [17:46<14:11,  2.84it/s]
 45%|████▍     | 1947/4361 [17:47<18:52,  2.13it/s]
 45%|████▍     | 1948/4361 [17:47<18:39,  2.16it/s]
 45%|████▍     | 1950/4361 [17:47<15:06,  2.66it/s]
 45%|████▍     | 1951/4361 [17:48<14:01,  2.87it/s]
 45%|████▍     | 1952/4361 [17:48<13:43,  2.92it/s]
 45%|████▍     | 1953/4361 [17:49<24:24,  1.64it/s]
 45%|████▍     | 1954/4361 [17:50<23:53,  1.68it/s]
 45%|████▍     | 1956/4361 [17:50<17:48,  2.25it/s]
 45%|████▍     | 1957/4361 [17:51<23:08,  1.73it/s]
 45%|████▍  

 49%|████▊     | 2121/4361 [19:32<19:54,  1.87it/s]
 49%|████▊     | 2122/4361 [19:33<28:46,  1.30it/s]
 49%|████▊     | 2123/4361 [19:34<29:12,  1.28it/s]
 49%|████▊     | 2124/4361 [19:35<31:58,  1.17it/s]
 49%|████▊     | 2125/4361 [19:35<25:53,  1.44it/s]
 49%|████▉     | 2126/4361 [19:36<26:27,  1.41it/s]
 49%|████▉     | 2127/4361 [19:36<22:19,  1.67it/s]
 49%|████▉     | 2128/4361 [19:37<18:54,  1.97it/s]
 49%|████▉     | 2129/4361 [19:37<18:52,  1.97it/s]
 49%|████▉     | 2130/4361 [19:37<17:25,  2.13it/s]
 49%|████▉     | 2131/4361 [19:38<14:02,  2.65it/s]
 49%|████▉     | 2132/4361 [19:38<13:12,  2.81it/s]
 49%|████▉     | 2133/4361 [19:38<12:43,  2.92it/s]
 49%|████▉     | 2134/4361 [19:39<14:28,  2.56it/s]
 49%|████▉     | 2135/4361 [19:39<13:11,  2.81it/s]
 49%|████▉     | 2136/4361 [19:39<10:23,  3.57it/s]
 49%|████▉     | 2137/4361 [19:39<08:49,  4.20it/s]
 49%|████▉     | 2138/4361 [19:39<07:41,  4.81it/s]
 49%|████▉     | 2139/4361 [19:40<07:54,  4.68it/s]
 49%|████▉  

 53%|█████▎    | 2312/4361 [20:58<10:39,  3.21it/s]
 53%|█████▎    | 2313/4361 [20:59<20:43,  1.65it/s]
 53%|█████▎    | 2315/4361 [21:01<20:12,  1.69it/s]
 53%|█████▎    | 2316/4361 [21:02<23:49,  1.43it/s]
 53%|█████▎    | 2317/4361 [21:02<24:49,  1.37it/s]
 53%|█████▎    | 2318/4361 [21:03<28:50,  1.18it/s]
 53%|█████▎    | 2319/4361 [21:04<27:32,  1.24it/s]
 53%|█████▎    | 2321/4361 [21:05<21:17,  1.60it/s]
 53%|█████▎    | 2322/4361 [21:05<17:39,  1.92it/s]
 53%|█████▎    | 2323/4361 [21:06<23:24,  1.45it/s]
 53%|█████▎    | 2325/4361 [21:07<22:25,  1.51it/s]
 53%|█████▎    | 2326/4361 [21:07<16:44,  2.03it/s]
 53%|█████▎    | 2327/4361 [21:08<16:36,  2.04it/s]
 53%|█████▎    | 2328/4361 [21:08<16:23,  2.07it/s]
 53%|█████▎    | 2330/4361 [21:09<13:29,  2.51it/s]
 53%|█████▎    | 2331/4361 [21:09<16:21,  2.07it/s]
 53%|█████▎    | 2332/4361 [21:10<14:22,  2.35it/s]
 53%|█████▎    | 2333/4361 [21:10<12:08,  2.78it/s]
 54%|█████▎    | 2334/4361 [21:12<27:01,  1.25it/s]
 54%|█████▎ 

 57%|█████▋    | 2495/4361 [23:20<14:37,  2.13it/s]
 57%|█████▋    | 2496/4361 [23:21<16:55,  1.84it/s]
 57%|█████▋    | 2497/4361 [23:21<13:17,  2.34it/s]
 57%|█████▋    | 2498/4361 [23:21<10:37,  2.92it/s]
 57%|█████▋    | 2499/4361 [23:22<08:25,  3.69it/s]
 57%|█████▋    | 2500/4361 [23:22<13:16,  2.34it/s]
 57%|█████▋    | 2502/4361 [23:22<09:59,  3.10it/s]
 57%|█████▋    | 2504/4361 [23:23<08:23,  3.69it/s]
 57%|█████▋    | 2505/4361 [23:23<07:27,  4.15it/s]
 57%|█████▋    | 2506/4361 [23:23<10:00,  3.09it/s]
 57%|█████▋    | 2507/4361 [23:25<19:11,  1.61it/s]
 58%|█████▊    | 2508/4361 [23:25<15:05,  2.05it/s]
 58%|█████▊    | 2509/4361 [23:26<16:42,  1.85it/s]
 58%|█████▊    | 2511/4361 [23:26<12:20,  2.50it/s]
 58%|█████▊    | 2512/4361 [23:26<13:54,  2.21it/s]
 58%|█████▊    | 2513/4361 [23:27<13:00,  2.37it/s]
 58%|█████▊    | 2514/4361 [23:27<10:51,  2.83it/s]
 58%|█████▊    | 2517/4361 [23:27<07:57,  3.86it/s]
 58%|█████▊    | 2519/4361 [23:27<06:27,  4.75it/s]
 58%|█████▊ 

 62%|██████▏   | 2692/4361 [24:35<09:53,  2.81it/s]
 62%|██████▏   | 2693/4361 [24:36<09:41,  2.87it/s]
 62%|██████▏   | 2695/4361 [24:36<08:05,  3.43it/s]
 62%|██████▏   | 2696/4361 [24:37<11:27,  2.42it/s]
 62%|██████▏   | 2697/4361 [24:38<14:05,  1.97it/s]
 62%|██████▏   | 2698/4361 [24:38<10:42,  2.59it/s]
 62%|██████▏   | 2699/4361 [24:38<12:04,  2.29it/s]
 62%|██████▏   | 2700/4361 [24:38<10:22,  2.67it/s]
 62%|██████▏   | 2701/4361 [24:39<11:41,  2.37it/s]
 62%|██████▏   | 2702/4361 [24:39<09:08,  3.03it/s]
 62%|██████▏   | 2704/4361 [24:39<07:02,  3.92it/s]
 62%|██████▏   | 2705/4361 [24:40<08:16,  3.34it/s]
 62%|██████▏   | 2707/4361 [24:41<10:10,  2.71it/s]
 62%|██████▏   | 2708/4361 [24:41<08:28,  3.25it/s]
 62%|██████▏   | 2709/4361 [24:42<13:41,  2.01it/s]
 62%|██████▏   | 2712/4361 [24:43<13:21,  2.06it/s]
 62%|██████▏   | 2713/4361 [24:43<10:39,  2.58it/s]
 62%|██████▏   | 2715/4361 [24:43<08:09,  3.36it/s]
 62%|██████▏   | 2717/4361 [24:44<09:22,  2.92it/s]
 62%|██████▏

 66%|██████▌   | 2888/4361 [25:53<33:15,  1.35s/it]
 66%|██████▌   | 2889/4361 [25:54<28:50,  1.18s/it]
 66%|██████▋   | 2890/4361 [25:54<21:46,  1.13it/s]
 66%|██████▋   | 2891/4361 [25:55<17:34,  1.39it/s]
 66%|██████▋   | 2893/4361 [25:55<13:41,  1.79it/s]
 66%|██████▋   | 2894/4361 [25:55<11:13,  2.18it/s]
 66%|██████▋   | 2895/4361 [25:56<08:48,  2.77it/s]
 66%|██████▋   | 2896/4361 [25:56<11:52,  2.06it/s]
 66%|██████▋   | 2897/4361 [25:57<15:06,  1.62it/s]
 66%|██████▋   | 2898/4361 [25:58<12:56,  1.88it/s]
 66%|██████▋   | 2900/4361 [25:58<10:54,  2.23it/s]
 67%|██████▋   | 2901/4361 [25:59<17:01,  1.43it/s]
 67%|██████▋   | 2902/4361 [26:00<14:13,  1.71it/s]
 67%|██████▋   | 2903/4361 [26:00<14:59,  1.62it/s]
 67%|██████▋   | 2904/4361 [26:01<13:57,  1.74it/s]
 67%|██████▋   | 2905/4361 [26:01<11:01,  2.20it/s]
 67%|██████▋   | 2906/4361 [26:01<10:35,  2.29it/s]
 67%|██████▋   | 2907/4361 [26:03<18:07,  1.34it/s]
 67%|██████▋   | 2908/4361 [26:04<22:37,  1.07it/s]
 67%|██████▋

 71%|███████   | 3078/4361 [27:19<07:49,  2.73it/s]
 71%|███████   | 3081/4361 [27:19<05:49,  3.66it/s]
 71%|███████   | 3082/4361 [27:19<05:01,  4.25it/s]
 71%|███████   | 3083/4361 [27:20<07:27,  2.86it/s]
 71%|███████   | 3084/4361 [27:20<08:39,  2.46it/s]
 71%|███████   | 3085/4361 [27:21<10:09,  2.09it/s]
 71%|███████   | 3087/4361 [27:21<07:52,  2.70it/s]
 71%|███████   | 3088/4361 [27:21<07:11,  2.95it/s]
 71%|███████   | 3089/4361 [27:22<07:02,  3.01it/s]
 71%|███████   | 3090/4361 [27:22<10:14,  2.07it/s]
 71%|███████   | 3091/4361 [27:23<08:14,  2.57it/s]
 71%|███████   | 3092/4361 [27:23<10:26,  2.03it/s]
 71%|███████   | 3093/4361 [27:24<11:01,  1.92it/s]
 71%|███████   | 3094/4361 [27:24<11:09,  1.89it/s]
 71%|███████   | 3095/4361 [27:25<10:38,  1.98it/s]
 71%|███████   | 3096/4361 [27:26<12:08,  1.74it/s]
 71%|███████   | 3097/4361 [27:26<12:37,  1.67it/s]
 71%|███████   | 3099/4361 [27:27<11:03,  1.90it/s]
 71%|███████   | 3100/4361 [27:29<20:05,  1.05it/s]
 71%|███████

 75%|███████▍  | 3266/4361 [28:44<06:58,  2.61it/s]
 75%|███████▍  | 3267/4361 [28:45<09:08,  1.99it/s]
 75%|███████▍  | 3268/4361 [28:45<07:29,  2.43it/s]
 75%|███████▍  | 3269/4361 [28:45<08:52,  2.05it/s]
 75%|███████▌  | 3272/4361 [28:46<07:30,  2.42it/s]
 75%|███████▌  | 3273/4361 [28:46<07:13,  2.51it/s]
 75%|███████▌  | 3275/4361 [28:47<05:46,  3.13it/s]
 75%|███████▌  | 3276/4361 [28:47<04:42,  3.84it/s]
 75%|███████▌  | 3277/4361 [28:47<06:06,  2.96it/s]
 75%|███████▌  | 3278/4361 [28:48<05:06,  3.53it/s]
 75%|███████▌  | 3279/4361 [28:48<05:23,  3.35it/s]
 75%|███████▌  | 3281/4361 [28:48<05:23,  3.33it/s]
 75%|███████▌  | 3282/4361 [28:50<11:17,  1.59it/s]
 75%|███████▌  | 3283/4361 [28:51<12:15,  1.47it/s]
 75%|███████▌  | 3284/4361 [28:51<10:32,  1.70it/s]
 75%|███████▌  | 3285/4361 [28:52<12:11,  1.47it/s]
 75%|███████▌  | 3288/4361 [28:52<09:08,  1.95it/s]
 75%|███████▌  | 3289/4361 [28:53<08:58,  1.99it/s]
 75%|███████▌  | 3290/4361 [28:53<08:34,  2.08it/s]
 75%|███████

 79%|███████▉  | 3453/4361 [30:11<10:38,  1.42it/s]
 79%|███████▉  | 3454/4361 [30:12<12:42,  1.19it/s]
 79%|███████▉  | 3455/4361 [30:13<10:31,  1.44it/s]
 79%|███████▉  | 3456/4361 [30:13<09:57,  1.52it/s]
 79%|███████▉  | 3457/4361 [30:14<08:39,  1.74it/s]
 79%|███████▉  | 3458/4361 [30:14<07:06,  2.12it/s]
 79%|███████▉  | 3459/4361 [30:15<09:35,  1.57it/s]
 79%|███████▉  | 3460/4361 [30:16<10:13,  1.47it/s]
 79%|███████▉  | 3461/4361 [30:16<08:47,  1.71it/s]
 79%|███████▉  | 3462/4361 [30:16<06:39,  2.25it/s]
 79%|███████▉  | 3463/4361 [30:17<09:57,  1.50it/s]
 79%|███████▉  | 3464/4361 [30:18<08:22,  1.78it/s]
 79%|███████▉  | 3465/4361 [30:19<12:58,  1.15it/s]
 80%|███████▉  | 3467/4361 [30:20<09:37,  1.55it/s]
 80%|███████▉  | 3468/4361 [30:21<10:57,  1.36it/s]
 80%|███████▉  | 3471/4361 [30:21<08:12,  1.81it/s]
 80%|███████▉  | 3472/4361 [30:22<09:27,  1.57it/s]
 80%|███████▉  | 3473/4361 [30:22<07:50,  1.89it/s]
 80%|███████▉  | 3474/4361 [30:23<08:26,  1.75it/s]
 80%|███████

 83%|████████▎ | 3634/4361 [31:56<08:28,  1.43it/s]
 83%|████████▎ | 3635/4361 [31:56<07:02,  1.72it/s]
 83%|████████▎ | 3636/4361 [31:57<06:21,  1.90it/s]
 83%|████████▎ | 3637/4361 [31:57<05:57,  2.03it/s]
 83%|████████▎ | 3639/4361 [31:58<05:41,  2.11it/s]
 83%|████████▎ | 3640/4361 [31:59<06:30,  1.85it/s]
 83%|████████▎ | 3641/4361 [31:59<05:33,  2.16it/s]
 84%|████████▎ | 3642/4361 [31:59<05:27,  2.20it/s]
 84%|████████▎ | 3643/4361 [32:00<07:46,  1.54it/s]
 84%|████████▎ | 3644/4361 [32:01<06:35,  1.81it/s]
 84%|████████▎ | 3645/4361 [32:02<08:24,  1.42it/s]
 84%|████████▎ | 3646/4361 [32:02<08:34,  1.39it/s]
 84%|████████▎ | 3647/4361 [32:04<12:06,  1.02s/it]
 84%|████████▎ | 3648/4361 [32:05<09:55,  1.20it/s]
 84%|████████▎ | 3649/4361 [32:05<08:55,  1.33it/s]
 84%|████████▎ | 3650/4361 [32:06<09:08,  1.30it/s]
 84%|████████▎ | 3651/4361 [32:06<07:56,  1.49it/s]
 84%|████████▎ | 3652/4361 [32:08<10:31,  1.12it/s]
 84%|████████▍ | 3653/4361 [32:09<11:06,  1.06it/s]
 84%|███████

 88%|████████▊ | 3819/4361 [33:54<04:39,  1.94it/s]
 88%|████████▊ | 3821/4361 [33:55<03:28,  2.59it/s]
 88%|████████▊ | 3823/4361 [33:55<03:17,  2.73it/s]
 88%|████████▊ | 3824/4361 [33:55<02:55,  3.06it/s]
 88%|████████▊ | 3825/4361 [33:57<05:48,  1.54it/s]
 88%|████████▊ | 3826/4361 [33:57<04:21,  2.04it/s]
 88%|████████▊ | 3828/4361 [33:58<04:22,  2.03it/s]
 88%|████████▊ | 3829/4361 [33:59<04:37,  1.92it/s]
 88%|████████▊ | 3831/4361 [34:01<05:51,  1.51it/s]
 88%|████████▊ | 3832/4361 [34:02<07:08,  1.23it/s]
 88%|████████▊ | 3833/4361 [34:02<05:45,  1.53it/s]
 88%|████████▊ | 3834/4361 [34:02<04:57,  1.77it/s]
 88%|████████▊ | 3836/4361 [34:03<03:58,  2.20it/s]
 88%|████████▊ | 3838/4361 [34:03<02:58,  2.93it/s]
 88%|████████▊ | 3839/4361 [34:04<04:11,  2.08it/s]
 88%|████████▊ | 3840/4361 [34:04<03:26,  2.53it/s]
 88%|████████▊ | 3841/4361 [34:04<03:16,  2.64it/s]
 88%|████████▊ | 3842/4361 [34:05<03:44,  2.31it/s]
 88%|████████▊ | 3843/4361 [34:05<04:10,  2.07it/s]
 88%|███████

 92%|█████████▏| 4021/4361 [35:34<02:51,  1.98it/s]
 92%|█████████▏| 4022/4361 [35:34<02:35,  2.17it/s]
 92%|█████████▏| 4023/4361 [35:35<02:20,  2.41it/s]
 92%|█████████▏| 4024/4361 [35:35<02:01,  2.77it/s]
 92%|█████████▏| 4025/4361 [35:35<01:40,  3.34it/s]
 92%|█████████▏| 4026/4361 [35:36<02:04,  2.70it/s]
 92%|█████████▏| 4027/4361 [35:36<02:03,  2.71it/s]
 92%|█████████▏| 4028/4361 [35:37<03:37,  1.53it/s]
 92%|█████████▏| 4030/4361 [35:38<03:20,  1.65it/s]
 92%|█████████▏| 4031/4361 [35:38<02:34,  2.13it/s]
 92%|█████████▏| 4032/4361 [35:39<03:23,  1.62it/s]
 92%|█████████▏| 4033/4361 [35:41<04:36,  1.19it/s]
 93%|█████████▎| 4035/4361 [35:41<03:38,  1.49it/s]
 93%|█████████▎| 4036/4361 [35:42<03:26,  1.57it/s]
 93%|█████████▎| 4037/4361 [35:42<02:53,  1.87it/s]
 93%|█████████▎| 4038/4361 [35:42<02:17,  2.35it/s]
 93%|█████████▎| 4039/4361 [35:43<01:53,  2.84it/s]
 93%|█████████▎| 4040/4361 [35:43<01:51,  2.88it/s]
 93%|█████████▎| 4042/4361 [35:44<02:09,  2.46it/s]
 93%|███████

 96%|█████████▋| 4205/4361 [36:58<00:50,  3.07it/s]
 96%|█████████▋| 4206/4361 [36:58<00:44,  3.48it/s]
 96%|█████████▋| 4207/4361 [36:59<01:02,  2.48it/s]
 96%|█████████▋| 4208/4361 [36:59<00:50,  3.03it/s]
 97%|█████████▋| 4209/4361 [37:00<00:57,  2.62it/s]
 97%|█████████▋| 4210/4361 [37:00<00:54,  2.77it/s]
 97%|█████████▋| 4211/4361 [37:01<00:57,  2.62it/s]
 97%|█████████▋| 4212/4361 [37:01<01:21,  1.83it/s]
 97%|█████████▋| 4213/4361 [37:02<01:03,  2.32it/s]
 97%|█████████▋| 4214/4361 [37:03<01:24,  1.74it/s]
 97%|█████████▋| 4217/4361 [37:03<01:03,  2.27it/s]
 97%|█████████▋| 4218/4361 [37:03<00:49,  2.88it/s]
 97%|█████████▋| 4219/4361 [37:05<01:46,  1.33it/s]
 97%|█████████▋| 4220/4361 [37:05<01:18,  1.79it/s]
 97%|█████████▋| 4221/4361 [37:05<01:03,  2.21it/s]
 97%|█████████▋| 4222/4361 [37:05<00:48,  2.86it/s]
 97%|█████████▋| 4223/4361 [37:06<01:02,  2.21it/s]
 97%|█████████▋| 4224/4361 [37:08<02:17,  1.00s/it]
 97%|█████████▋| 4225/4361 [37:12<04:02,  1.78s/it]
 97%|███████

CPU times: user 15.3 s, sys: 4.82 s, total: 20.1 s
Wall time: 39min 3s


In [14]:
# Turn the collected per-file results into a two-column table.
transcript_df = pd.DataFrame(
    data=transcript_dict,
    columns=['audio_file', 'google_transcription'],
)
# Row count, then a preview of the first rows.
print(transcript_df.shape[0])
transcript_df.head()

4361


Unnamed: 0,audio_file,google_transcription
0,data_processed_DCB/wav/DCB_se1_ag1_m_01_1_part...,I just want to do everything
1,data_processed_DCB/wav/DCB_se1_ag1_m_01_1_part...,ugly one message for people made
2,data_processed_DCB/wav/DCB_se1_ag1_m_01_1_part...,I had a you practice and I just told me up for...
3,data_processed_DCB/wav/DCB_se1_ag1_m_01_1_part...,find something that you like by something is d...
4,data_processed_DCB/wav/DCB_se1_ag1_m_01_1_part...,because my family's most be spread out to dece...


In [15]:
# Leftover debug marker: prints a fixed string and defines no state.
print("HEEEELLLLOO")

HEEEELLLLOO


In [16]:
#join dataframes
manifest['key'] = manifest.wav_file.apply(lambda x: x.split("/")[-1])
manifest.head()

Unnamed: 0,wav_file,txt_file,groundtruth_text,duration,age,gender,key
0,data_processed_DCB/wav/DCB_se1_ag1_m_01_1_part...,data_processed_DCB/txt/DCB_se1_ag1_m_01_1_part...,"Uh, I want to- I'm going to pursue IT. And I'm...",13.18,18,Male,DCB_se1_ag1_m_01_1_part_1.wav
1,data_processed_DCB/wav/DCB_se1_ag1_m_01_1_part...,data_processed_DCB/txt/DCB_se1_ag1_m_01_1_part...,showing that all young black men shouldn't go ...,21.988,18,Male,DCB_se1_ag1_m_01_1_part_2.wav
2,data_processed_DCB/wav/DCB_se1_ag1_m_01_1_part...,data_processed_DCB/txt/DCB_se1_ag1_m_01_1_part...,[And one-] And once you in college we will try...,5.134,18,Male,DCB_se1_ag1_m_01_1_part_3.wav
3,data_processed_DCB/wav/DCB_se1_ag1_m_01_1_part...,data_processed_DCB/txt/DCB_se1_ag1_m_01_1_part...,"Uh, well, basically as of today, Congress Heig...",30.588,18,Male,DCB_se1_ag1_m_01_1_part_4.wav
4,data_processed_DCB/wav/DCB_se1_ag1_m_01_1_part...,data_processed_DCB/txt/DCB_se1_ag1_m_01_1_part...,"Uh, I had /began before the street life/ for- ...",28.943,18,Male,DCB_se1_ag1_m_01_1_part_5.wav


In [17]:
# Same join key for the transcripts: the text after the last "/" of each
# audio_file object key.
transcript_df['key'] = [
    object_key.split("/")[-1] for object_key in transcript_df['audio_file']
]
transcript_df.head()

Unnamed: 0,audio_file,google_transcription,key
0,data_processed_DCB/wav/DCB_se1_ag1_m_01_1_part...,I just want to do everything,DCB_se1_ag1_m_01_1_part_10.wav
1,data_processed_DCB/wav/DCB_se1_ag1_m_01_1_part...,ugly one message for people made,DCB_se1_ag1_m_01_1_part_100.wav
2,data_processed_DCB/wav/DCB_se1_ag1_m_01_1_part...,I had a you practice and I just told me up for...,DCB_se1_ag1_m_01_1_part_21.wav
3,data_processed_DCB/wav/DCB_se1_ag1_m_01_1_part...,find something that you like by something is d...,DCB_se1_ag1_m_01_1_part_101.wav
4,data_processed_DCB/wav/DCB_se1_ag1_m_01_1_part...,because my family's most be spread out to dece...,DCB_se1_ag1_m_01_1_part_12.wav


In [18]:
# Index both tables by file name, then keep only the names present in both.
manifest_by_key = manifest.set_index('key')
transcripts_by_key = transcript_df.set_index('key')
result = manifest_by_key.join(
    transcripts_by_key,
    how='inner',
    lsuffix='_caller',
    rsuffix='_other',
)
# Row count of the joined table, then a preview.
print(len(result))
result.head()

4361


Unnamed: 0_level_0,wav_file,txt_file,groundtruth_text,duration,age,gender,audio_file,google_transcription
key,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1
DCB_se1_ag1_m_01_1_part_1.wav,data_processed_DCB/wav/DCB_se1_ag1_m_01_1_part...,data_processed_DCB/txt/DCB_se1_ag1_m_01_1_part...,"Uh, I want to- I'm going to pursue IT. And I'm...",13.18,18,Male,data_processed_DCB/wav/DCB_se1_ag1_m_01_1_part...,I want it going to pursue it nonprofit program...
DCB_se1_ag1_m_01_1_part_2.wav,data_processed_DCB/wav/DCB_se1_ag1_m_01_1_part...,data_processed_DCB/txt/DCB_se1_ag1_m_01_1_part...,showing that all young black men shouldn't go ...,21.988,18,Male,data_processed_DCB/wav/DCB_se1_ag1_m_01_1_part...,all young black man shouldn't go to the street...
DCB_se1_ag1_m_01_1_part_3.wav,data_processed_DCB/wav/DCB_se1_ag1_m_01_1_part...,data_processed_DCB/txt/DCB_se1_ag1_m_01_1_part...,[And one-] And once you in college we will try...,5.134,18,Male,data_processed_DCB/wav/DCB_se1_ag1_m_01_1_part...,don't want you in college me try to do college
DCB_se1_ag1_m_01_1_part_4.wav,data_processed_DCB/wav/DCB_se1_ag1_m_01_1_part...,data_processed_DCB/txt/DCB_se1_ag1_m_01_1_part...,"Uh, well, basically as of today, Congress Heig...",30.588,18,Male,data_processed_DCB/wav/DCB_se1_ag1_m_01_1_part...,baked brie as of today has lost in a month hou...
DCB_se1_ag1_m_01_1_part_5.wav,data_processed_DCB/wav/DCB_se1_ag1_m_01_1_part...,data_processed_DCB/txt/DCB_se1_ag1_m_01_1_part...,"Uh, I had /began before the street life/ for- ...",28.943,18,Male,data_processed_DCB/wav/DCB_se1_ag1_m_01_1_part...,play street lights for a swage 14 because of t...


In [19]:
# Number of listed audio files, for comparison with the joined row count.
print(len(audio_files))

4361


In [20]:
# Number of joined rows whose transcription is NaN, i.e. files for which the
# transcription helper reported a failure. Files for which nothing was
# recognized produce an empty string rather than NaN and are not counted here.
len(result[result.google_transcription.isna()])

0

In [21]:
# Write the joined table to OUTPUT_PATH. index=False leaves out the `key`
# index; the wav_file and audio_file columns still identify each row.
result.to_csv(OUTPUT_PATH, index = False)