In [None]:
## Running the DeepSpeech transcriber

In [1]:
import deepspeech
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
import wave



In [2]:
# DeepSpeech trained model (acoustic model + external language-model scorer)
model_path = 'deepspeech-models/deepspeech-0.8.2-models.pbmm'
model_scorer_path = 'deepspeech-models/deepspeech-0.8.2-models.scorer'

# Decoder hyper-parameters.
lm_alpha = 0.75    # passed to setScorerAlphaBeta as alpha
lm_beta = 1.85     # passed to setScorerAlphaBeta as beta
beam_width = 500   # passed to setBeamWidth

model = deepspeech.Model(model_path)
# Apply the configured beam width; previously the value was defined but never
# handed to the model, so editing it had no effect.
model.setBeamWidth(beam_width)
model.enableExternalScorer(model_scorer_path)
# Kept as the last expression so the cell still displays its return code.
model.setScorerAlphaBeta(lm_alpha, lm_beta)

0

In [3]:
# WAV file to transcribe; later cells reassign audio_file before each extract() call.
audio_file = "/home/arun/shares/PROXY/NAS/Testing STT/sample_01.wav"

In [4]:
def extract(audio_file):
    """Transcribe a WAV file with the module-level DeepSpeech ``model``.

    The whole file is read into memory and decoded with a single
    ``model.stt`` call. Diagnostic information is printed along the way.

    Parameters
    ----------
    audio_file : str
        Path to a WAV file. It must be mono with 16-bit samples, because the
        raw frame bytes are reinterpreted as a flat ``int16`` array.

    Returns
    -------
    list of str
        A one-element list holding the transcript.

    Raises
    ------
    ValueError
        If the file is not mono or its samples are not 16 bits wide.
    """
    srt = []
    print("Going to process the audio file : {} ".format(audio_file))
    with wave.open(audio_file, 'rb') as w:
        rate = w.getframerate()
        frames = w.getnframes()
        channels = w.getnchannels()
        sample_width = w.getsampwidth()
        print("[process] Audio bit/rate -> [{}]".format(rate))
        # NOTE: despite the label, this value is the number of frames.
        print("[process] Frame rate -> [{}]".format(frames))
        buffer = w.readframes(frames)
    print("[process] Buffer length is : {}".format(len(buffer)))

    model_rate = model.sampleRate()
    print("The sample rate is : {}".format(model_rate))

    # The bytes are viewed as int16 below; any other layout would be
    # misread silently and yield a meaningless transcript.
    if sample_width != 2:
        raise ValueError(
            "Expected 16-bit samples, got {}-bit audio in {}".format(
                8 * sample_width, audio_file))
    if channels != 1:
        raise ValueError(
            "Expected mono audio, got {} channels in {}".format(
                channels, audio_file))
    if rate != model_rate:
        # Still decodable, but accuracy degrades when the rates differ.
        print("[process] WARNING: audio sample rate {} does not match the "
              "model sample rate {}".format(rate, model_rate))

    formated_buffer = np.frombuffer(buffer, dtype=np.int16)
    text = model.stt(formated_buffer)
    srt.append(text)
    return srt

In [None]:
# Batch wise recognition
# Feed the audio to a DeepSpeech stream in fixed-size chunks instead of
# decoding the whole buffer with a single model.stt() call.
with wave.open(audio_file, 'rb') as w:
    # Read the samples here: `buffer` inside extract() is local to that
    # function, so this cell cannot rely on it after a kernel restart.
    buffer = w.readframes(w.getnframes())

ds_stream = model.createStream()
buffer_len = len(buffer)
batch_size = 16384  # bytes per chunk; even, so no 16-bit sample is split
for offset in range(0, buffer_len, batch_size):
    chunk = buffer[offset:offset + batch_size]
    data16 = np.frombuffer(chunk, dtype=np.int16)
    ds_stream.feedAudioContent(data16)
    # ds_stream.intermediateDecode() can be called here to inspect the
    # partial transcript; it is skipped because only the final text is used.

# finishStream() runs the final decode and releases the stream.
text = ds_stream.finishStream()
print(text)

In [5]:
# Transcribe sample_01.wav and show the list returned by extract().
audio_file = "/home/arun/shares/PROXY/NAS/Testing STT/sample_01.wav"
transcripts = extract(audio_file)
print(transcripts)

Going to process the audio file : /home/arun/shares/PROXY/NAS/Testing STT/sample_01.wav 
[process] Audio bit/rate -> [16000]
[process] Frame rate -> [178240]
[process] Buffer length is : 356480
The sample rate is : 16000
['and chief just as of the massachusetts supreme court in april the stress current leader edward hennesey reaches the mandatory retirement age of seventy and his successor is']


In [6]:
# Transcribe sample_02.wav and show the list returned by extract().
audio_file = "/home/arun/shares/PROXY/NAS/Testing STT/sample_02.wav"
transcripts = extract(audio_file)
print(transcripts)

Going to process the audio file : /home/arun/shares/PROXY/NAS/Testing STT/sample_02.wav 
[process] Audio bit/rate -> [16000]
[process] Frame rate -> [178080]
[process] Buffer length is : 356160
The sample rate is : 16000
['the justice of the locusts are grand court they had aulestes praeter and were here grates the mandatory retire age seven gates excess']


In [7]:
# Transcribe sample_03.wav and show the list returned by extract().
audio_file = "/home/arun/shares/PROXY/NAS/Testing STT/sample_03.wav"
transcripts = extract(audio_file)
print(transcripts)

Going to process the audio file : /home/arun/shares/PROXY/NAS/Testing STT/sample_03.wav 
[process] Audio bit/rate -> [16000]
[process] Frame rate -> [178080]
[process] Buffer length is : 356160
The sample rate is : 16000
['the justice of massachusetts a green court in deep because these current leader in war heneage that mandatory retirement tisserand the simpsons']


In [8]:
# Transcribe sample_04.wav and show the list returned by extract().
audio_file = "/home/arun/shares/PROXY/NAS/Testing STT/sample_04.wav"
transcripts = extract(audio_file)
print(transcripts)

Going to process the audio file : /home/arun/shares/PROXY/NAS/Testing STT/sample_04.wav 
[process] Audio bit/rate -> [16000]
[process] Frame rate -> [178240]
[process] Buffer length is : 356480
The sample rate is : 16000
['wanted chief just as of the massachusetts supreme court in april the scs current leader edward hennesey reaches the mandatory retirement age of seventy and his successor is']


In [9]:
# Transcribe sample_05.wav and show the list returned by extract().
audio_file = "/home/arun/shares/PROXY/NAS/Testing STT/sample_05.wav"
transcripts = extract(audio_file)
print(transcripts)

Going to process the audio file : /home/arun/shares/PROXY/NAS/Testing STT/sample_05.wav 
[process] Audio bit/rate -> [16000]
[process] Frame rate -> [187040]
[process] Buffer length is : 374080
The sample rate is : 16000
['to be named in marriage it may be the most important appointment governor makedama during the remainder of his administration and one of the toughest as we war as murger melnikov']


In [10]:
# Transcribe sample_06.wav and show the list returned by extract().
audio_file = "/home/arun/shares/PROXY/NAS/Testing STT/sample_06.wav"
transcripts = extract(audio_file)
print(transcripts)

Going to process the audio file : /home/arun/shares/PROXY/NAS/Testing STT/sample_06.wav 
[process] Audio bit/rate -> [16000]
[process] Frame rate -> [186880]
[process] Buffer length is : 373760
The sample rate is : 16000
['manage it the masking point on the point by evident idea departs may extremely remainder of his administration in one of the test is that the bears nor amalia']


In [11]:
# Transcribe sample_07.wav and show the list returned by extract().
audio_file = "/home/arun/shares/PROXY/NAS/Testing STT/sample_07.wav"
transcripts = extract(audio_file)
print(transcripts)

Going to process the audio file : /home/arun/shares/PROXY/NAS/Testing STT/sample_07.wav 
[process] Audio bit/rate -> [16000]
[process] Frame rate -> [186880]
[process] Buffer length is : 373760
The sample rate is : 16000
['in may be the most important a point queenlike declares was during the remainder of his invitation and one of the tallest is tabooed']


In [12]:
# Transcribe sample_08.wav and show the list returned by extract().
audio_file = "/home/arun/shares/PROXY/NAS/Testing STT/sample_08.wav"
transcripts = extract(audio_file)
print(transcripts)

Going to process the audio file : /home/arun/shares/PROXY/NAS/Testing STT/sample_08.wav 
[process] Audio bit/rate -> [16000]
[process] Frame rate -> [128640]
[process] Buffer length is : 257280
The sample rate is : 16000
['repoint out that it school based clinics were established parental permission would be required for students to receive each service offered']


In [13]:
# Transcribe stt_sample_08.mp4.audio.wav and show the list returned by extract().
audio_file = "/home/arun/shares/PROXY/NAS/Testing STT/stt_sample_08.mp4.audio.wav"
transcripts = extract(audio_file)
print(transcripts)

Going to process the audio file : /home/arun/shares/PROXY/NAS/Testing STT/stt_sample_08.mp4.audio.wav 
[process] Audio bit/rate -> [16000]
[process] Frame rate -> [3595193]
[process] Buffer length is : 7190386
The sample rate is : 16000
["what is poetry a page and ripped out her wearisomely isle there are without sir of what you can to grow ripe down sir we never more understanding poetry by doctor j evans pritchard kid the polanders and poetry we must first be fluent with its meter of rhyme and figures of speak then asked you questions one how artfully as the objective of the poem been rendered to how important is that objective question one reads the poem perfection question to rate importance and once of questions have been answered the terming the poems greatness become a relatively simple matter if the bonsor for perfection is applied on the horizontal of a grapestone they made a rising to believe me it's true i do believe you tom gave mister kit but it was in his time on distant 

In [14]:
# Transcribe stt_sample_07.mp4.audio.wav and show the list returned by extract().
audio_file = "/home/arun/shares/PROXY/NAS/Testing STT/stt_sample_07.mp4.audio.wav"
transcripts = extract(audio_file)
print(transcripts)

Going to process the audio file : /home/arun/shares/PROXY/NAS/Testing STT/stt_sample_07.mp4.audio.wav 
[process] Audio bit/rate -> [16000]
[process] Frame rate -> [5810562]
[process] Buffer length is : 11621124
The sample rate is : 16000
["we've all heard them said then a shattered them at our friends there on artesia coffee mugs and are vintage at sea needle point sweaters these are the top one hundred most ionic movie quotes of all time the greatest trick but devil ever pulled was convincing the world he didn't exist she and this world as to transpose my friend and his loaded guns hoddesdon need amenhotep together aliandra that way he is robinson your drives a boll have what she's having as far back as i could remember i always wanted to be a gangster somtimes even entrancement time to eradicate meant you're going and get life move pretty fast you don't stop and look around with an ill you can he have a problem but we've got here is there took me canterburies do not come about by one

In [15]:
# Transcribe stt_sample_06.mp4.audio.wav and show the list returned by extract().
audio_file = "/home/arun/shares/PROXY/NAS/Testing STT/stt_sample_06.mp4.audio.wav"
transcripts = extract(audio_file)
print(transcripts)

Going to process the audio file : /home/arun/shares/PROXY/NAS/Testing STT/stt_sample_06.mp4.audio.wav 
[process] Audio bit/rate -> [16000]
[process] Frame rate -> [4581576]
[process] Buffer length is : 9163152
The sample rate is : 16000
["press some one chris as from his abuseth where a shirt to day you know being the last day and all and thank you how appreciate that butter whereon to morrow though kay because to mars going to be your first day if you'd like to work here as a broker would you like that chris you sir good we couldn't be happier so welcome was it as easy as it looked no sir mozart wasn't good lacrimose contis part of my life this little part is called in athenagoras in an onconsarned nobody on"]


In [19]:
# Transcribe stt_sample_01.mp4.audio.wav and show the list returned by extract().
audio_file = "/home/arun/shares/PROXY/NAS/Testing STT/stt_sample_01.mp4.audio.wav"
transcripts = extract(audio_file)
print(transcripts)

Going to process the audio file : /home/arun/shares/PROXY/NAS/Testing STT/stt_sample_01.mp4.audio.wav 
[process] Audio bit/rate -> [16000]
[process] Frame rate -> [3268256]
[process] Buffer length is : 6536512
The sample rate is : 16000
['a bronson while an three times the size of our son or to end its life had with a collapse the gravitation of forces of the entire mass overcoming the electro magnetic forces of individual atoms and soul collapsing inward if the star is massive enough it will continue this collapse creating a black hole where the warping of space time is so great that nothing can escape not even light it gets smaller smaller the star in fact gets denser as atoms even subatomic particles kept literally crushed into smaller and smaller space and a end point what are we left with a space time singularity space and time come to a stone relations there about that coast to the entire itchiness right is general relativity project then the universe expanding has if you reverse

In [20]:
# Transcribe stt_sample_02.mp4.audio.wav and show the list returned by extract().
audio_file = "/home/arun/shares/PROXY/NAS/Testing STT/stt_sample_02.mp4.audio.wav"
transcripts = extract(audio_file)
print(transcripts)

Going to process the audio file : /home/arun/shares/PROXY/NAS/Testing STT/stt_sample_02.mp4.audio.wav 
[process] Audio bit/rate -> [16000]
[process] Frame rate -> [3300206]
[process] Buffer length is : 6600412
The sample rate is : 16000
["then where are we that the asinine day and this is the mutineers home to many of the greatest paintings in his wonderful ignored a bustling monforte chances we can never when chimaera my child and there is another cracker for it so so good i just wondered between you and me and earthenware where d you think bengore sister of a well big question but to me then go i find pentruan most popular great painter for all time the most been loved his command of carlos magnificent he transformed the pain is tormented life into is dabat paine is easy to portray them to use your passion and pain to betray the estacion joy and magnificent so our world no one had ever done it before perhaps an o and ever will again to my mind that strange wild man who roamed the fie

In [21]:
# Transcribe stt_sample_03.mp4.audio.wav and show the list returned by extract().
audio_file = "/home/arun/shares/PROXY/NAS/Testing STT/stt_sample_03.mp4.audio.wav"
transcripts = extract(audio_file)
print(transcripts)

Going to process the audio file : /home/arun/shares/PROXY/NAS/Testing STT/stt_sample_03.mp4.audio.wav 
[process] Audio bit/rate -> [16000]
[process] Frame rate -> [8525253]
[process] Buffer length is : 17050506
The sample rate is : 16000
["so what makes you think that i'm going to let the whitest man that i have ever seen interview for our firm because i haven't pointed you can do this you did what is wrong with you humour eleven years old i was led to puberty okay i respect and excuse me i was to go back on me for a swim of the boiled her night course sir the children will do best in the city he is the poor clothes i do you the time i can o'clock sorry god utiarity to think one of whom tales just walk in a state radio rick stork in a stork in rick organ excuse me mister skin you are five minutes late there a reason why i should let you in or to the oilometer pete will be rightly he what can get you anything a coffee or water i rick sort pariset or nice to meet you to a sea as can i he

In [None]:
# Transcribe stt_sample_02.mp4.audio.wav and show the list returned by extract().
audio_file = "/home/arun/shares/PROXY/NAS/Testing STT/stt_sample_02.mp4.audio.wav"
transcripts = extract(audio_file)
print(transcripts)

In [None]:
# Transcribe stt_sample_01.mp4.audio.wav and show the list returned by extract().
audio_file = "/home/arun/shares/PROXY/NAS/Testing STT/stt_sample_01.mp4.audio.wav"
transcripts = extract(audio_file)
print(transcripts)