In [1]:
# Import Library
from flask import Flask, render_template, request, session, jsonify
from transformers import Wav2Vec2ProcessorWithLM, Wav2Vec2ForCTC, Wav2Vec2Processor
import speech_recognition as sr
import torch
import gc
import librosa
import numpy as np
import onnxruntime as rt
import time
from flask_socketio import SocketIO, emit
import os

2023-06-19 17:04:37.882217: I tensorflow/core/platform/cpu_feature_guard.cc:182] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.
To enable the following instructions: AVX2 FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.


In [2]:
# Configuration shared by the feature-extraction helpers and the Flask app.

# Sampling rate (Hz) passed to librosa whenever audio is loaded.
SAMPLE_RATE = 16_000
# STFT window size and hop length, in samples.
FFT_SIZE = 2048
HOP_SIZE = 512
# Number of mel bands in the mel filter bank.
N_MELS = 26
# Number of MFCC coefficients kept per frame.
MFCC_BINS = 13
# Number of time frames the MFCC matrix is padded or truncated to.
MAX_LEN_PAD = 32
# Feature planes of the classifier input: MFCC, delta and delta-delta.
CHANNELS = 3
# Forwarded to SocketIO as its async_mode argument.
async_mode = None
# Directory listing of the classification dataset, relative to the current working directory.
# NOTE(review): presumably one entry per speaker class - confirm. os.listdir returns
# entries in arbitrary order, so verify it matches the order the classifier was trained with.
dataset_directory = os.getcwd() + "/Audio Classification/AudioClassification Dataset"
dataset_labels = os.listdir(dataset_directory)

In [3]:
# Necessary Function

def resample_audio(path):
    """Load an audio file at SAMPLE_RATE and force it to exactly one second.

    Parameters
    ----------
    path : str or path-like
        Audio file to read with ``librosa.load``.

    Returns
    -------
    numpy.ndarray
        Waveform of exactly ``SAMPLE_RATE`` samples: shorter clips are
        zero-padded at the end, longer clips are truncated.
    """
    # The returned rate is not needed; binding it to ``_rate`` (instead of ``sr``)
    # also avoids shadowing the speech_recognition alias inside this function.
    waveform, _rate = librosa.load(path, sr=SAMPLE_RATE)
    missing = SAMPLE_RATE - len(waveform)
    if missing > 0:
        # Pad length is derived from SAMPLE_RATE rather than a literal 16000 so
        # that the pad and truncate branches always agree on the target length.
        return np.pad(waveform, (0, missing), "constant")
    return waveform[:SAMPLE_RATE]

def stft(audio):
    """Return the power spectrogram (squared STFT magnitude) of a waveform.

    The STFT uses FFT_SIZE-sample windows, a HOP_SIZE hop, centered frames and
    constant padding at the edges.
    """
    spectrum = librosa.stft(
        y=audio,
        n_fft=FFT_SIZE,
        hop_length=HOP_SIZE,
        center=True,
        pad_mode='constant',
    )
    return np.abs(spectrum) ** 2

def mel_frequency(spectrogram):
    """Project a power spectrogram onto N_MELS mel bands and convert it to dB.

    The dB conversion is referenced to the maximum value of the mel spectrogram.
    """
    filter_bank = librosa.filters.mel(sr=SAMPLE_RATE, n_fft=FFT_SIZE, n_mels=N_MELS)
    mel_power = filter_bank.dot(spectrogram)
    return librosa.power_to_db(mel_power, ref=np.max)

def mfcc(mel_freq):
    """Compute MFCC_BINS MFCCs from a mel spectrogram, fixed to MAX_LEN_PAD frames.

    The time axis (axis 1) is zero-padded at the end when it is shorter than
    MAX_LEN_PAD and truncated otherwise.
    """
    coefficients = librosa.feature.mfcc(
        S=mel_freq,
        sr=SAMPLE_RATE,
        n_mfcc=MFCC_BINS,
        n_fft=FFT_SIZE,
        hop_length=HOP_SIZE,
        n_mels=N_MELS,
    )
    n_frames = coefficients.shape[1]
    if n_frames >= MAX_LEN_PAD:
        return coefficients[:, :MAX_LEN_PAD]
    shortfall = MAX_LEN_PAD - n_frames
    return np.pad(coefficients, pad_width=((0, 0), (0, shortfall)))

def delta_mfcc(mfcc):
    """Return the delta features of ``mfcc`` computed by ``librosa.feature.delta``."""
    return librosa.feature.delta(mfcc)

def delta_delta_mfcc(mfcc):
    """Return the second-order delta features of ``mfcc`` (``order=2``)."""
    return librosa.feature.delta(mfcc, order=2)

def speaker_input_preprocessing(audio):
    """Build the speaker-classifier input tensor from a recording.

    The original implementation ignored ``audio`` and always re-read
    "microphone-results.wav" from the working directory. The argument is now
    honoured, so the features describe the clip the caller actually passed.

    Parameters
    ----------
    audio : numpy.ndarray, str, os.PathLike or None
        * ``numpy.ndarray`` - waveform, assumed to be sampled at SAMPLE_RATE;
          it is zero-padded or truncated to SAMPLE_RATE samples.
        * non-empty ``str`` / path-like - audio file loaded via ``resample_audio``.
        * anything else (``None``, ``""``) - falls back to
          "microphone-results.wav", the file the previous version always used.

    Returns
    -------
    numpy.ndarray
        ``float32`` array of shape ``(1, MFCC_BINS, MAX_LEN_PAD, CHANNELS)``;
        channel 0 holds the MFCCs, channel 1 the deltas, channel 2 the
        delta-deltas.
    """
    if isinstance(audio, np.ndarray):
        # Same pad/truncate rule that resample_audio applies after loading.
        shortfall = SAMPLE_RATE - len(audio)
        if shortfall > 0:
            waveform = np.pad(audio, (0, shortfall), "constant")
        else:
            waveform = audio[:SAMPLE_RATE]
    elif isinstance(audio, (str, os.PathLike)) and audio:
        waveform = resample_audio(audio)
    else:
        waveform = resample_audio("microphone-results.wav")

    mel_db = mel_frequency(stft(waveform))

    audio_speaker_mfcc = mfcc(mel_db)
    audio_speaker_delta = delta_mfcc(audio_speaker_mfcc)
    audio_speaker_delta_delta = delta_delta_mfcc(audio_speaker_mfcc)

    # Stack the three feature maps along the last (channel) axis.
    audio_speaker_input = np.zeros((1, MFCC_BINS, MAX_LEN_PAD, CHANNELS), dtype=np.float32)
    audio_speaker_input[:, :, :, 0] = audio_speaker_mfcc
    audio_speaker_input[:, :, :, 1] = audio_speaker_delta
    audio_speaker_input[:, :, :, 2] = audio_speaker_delta_delta
    return audio_speaker_input

In [4]:
# Load every model once; the route handlers defined later reuse these module-level objects.

# Wav2Vec2 CTC model restored from a local checkpoint directory and moved to the CUDA device.
model = Wav2Vec2ForCTC.from_pretrained("Automatic Speech Recognition/asr_skripsi_local_common_voice/checkpoint-2400").to("cuda")
# Processor used to turn raw audio into model inputs.
processor = Wav2Vec2Processor.from_pretrained("Automatic Speech Recognition/asr_skripsi_local_common_voice/")
# Processor with a language model, used to decode logits into text; loaded with eos/bos tokens set to None.
processorLM = Wav2Vec2ProcessorWithLM.from_pretrained("Automatic Speech Recognition/asr_LM_skripsi_local_common_voice", eos_token=None, bos_token=None)
# ONNX Runtime session for the audio classifier, requesting only the CUDA execution provider.
model_onnx = rt.InferenceSession('Audio Classification/Classification.simplified.onnx', providers=["CUDAExecutionProvider"])

Special tokens have been added in the vocabulary, make sure the associated word embeddings are fine-tuned or trained.


In [5]:
# Module-level speech recognizer with dynamic energy thresholding enabled.
# NOTE(review): the /listen handler creates its own Recognizer, so this
# instance appears to be unused by the code in this notebook - confirm.
listener = sr.Recognizer()
listener.dynamic_energy_threshold = True
# Fixed-threshold alternative, left disabled:
# listener.energy_threshold = 4500

In [6]:
# Flask app; templates and static files are served from the MonitoringWeb folder.
app = Flask(__name__, template_folder='MonitoringWeb', static_folder='MonitoringWeb/static')
# Socket.IO wrapper around the app, accepting connections from any origin.
# NOTE(review): `headers` is not an obvious SocketIO option - confirm it has any effect.
socketio = SocketIO(app, async_mode=async_mode, cors_allowed_origins="*", headers = {"Content-Type": "application/json; charset=utf-8"})
# Module-level state shared between the route handlers; empty strings are
# placeholders until /preprocessing assigns real values.
#   audio               - assigned by /preprocessing, read by /word-predict
#   audio_speaker_input - assigned by /preprocessing, read by /speaker-predict
#   _                   - receives the sample rate returned by librosa.load in /preprocessing
audio = ""
audio_speaker_input = ""
_ = ""

@app.route('/', methods=["GET", "POST"])
def index():
    """Serve the monitoring page with its initial progress text."""
    initial_progress = "Wait For Record"
    return render_template('index.html', progress=initial_progress)

@app.route('/listen', methods=['POST'])
def record():
    """Record one utterance from the default microphone and save it as a WAV file.

    Expects a JSON object containing the key ``record``. The microphone is
    calibrated against ambient noise for 5 seconds, then one phrase (limited to
    5 seconds by ``phrase_time_limit``) is captured and written to
    "microphone-results.wav" in the working directory.

    Returns
    -------
    flask.Response
        ``{'path': <absolute path of the WAV file>}`` on success.
        ``{'error': ...}`` with status 400 when the body is not a JSON object
        containing ``record``, or status 500 when capturing fails. Previously
        both cases returned ``None``, which Flask turns into an opaque 500.
    """
    listener = sr.Recognizer()
    listener.dynamic_energy_threshold = True
    # silent=True yields None for a missing/invalid JSON body instead of raising.
    data = request.get_json(silent=True)
    print(data)
    if not isinstance(data, dict) or 'record' not in data:
        return jsonify({'error': "Request body must be a JSON object containing 'record'"}), 400

    try:
        with sr.Microphone() as mic:
            listener.adjust_for_ambient_noise(mic, duration=5)
            print("Listening...")
            recording = listener.listen(mic, phrase_time_limit=5)
    except sr.UnknownValueError:
        # Exception type kept from the original handler.
        # NOTE(review): confirm whether Microphone/listen can actually raise it.
        return jsonify({'error': "Could not capture audio from the microphone"}), 500

    # The microphone is released before the file is written.
    output_path = "microphone-results.wav"
    with open(output_path, "wb") as f:
        f.write(recording.get_wav_data())
    return jsonify({'path': os.path.abspath(output_path)})


@app.route('/preprocessing', methods=['POST'])
def preprocessing():
    """Load the recorded clip and prepare the inputs for both predictors.

    Expects a JSON object with the key ``audioPath`` naming an audio file.
    On success the module-level ``audio`` (waveform loaded at SAMPLE_RATE) and
    ``audio_speaker_input`` (result of ``speaker_input_preprocessing``) are
    updated for the prediction routes.

    Returns
    -------
    flask.Response
        ``{'status': "PreProcessing Done!"}`` when the clip is at most 5 seconds,
        ``{'status': "Audio Duration More Than 5 Secs"}`` when it is longer,
        or a ``{'status': ...}`` message with status 400 / 404 when
        ``audioPath`` is missing or does not name an existing file.
    """
    global audio
    global audio_speaker_input
    global _

    # Validate the body up front so malformed requests get a clear 400 instead
    # of an unhandled KeyError/TypeError.
    payload = request.get_json(silent=True)
    data = payload.get('audioPath') if isinstance(payload, dict) else None
    if not isinstance(data, str) or not data:
        return jsonify({'status': "Missing 'audioPath' in request body"}), 400
    print(data)

    # SECURITY NOTE: the path comes straight from the client and is opened as
    # is; restrict it to a known directory before exposing this route beyond
    # localhost.
    if not os.path.isfile(data):
        return jsonify({'status': "Audio file not found"}), 404

    audio, _ = librosa.load(data, sr=SAMPLE_RATE)
    audio_len = librosa.get_duration(y=audio, sr=SAMPLE_RATE)

    audio_speaker_input = speaker_input_preprocessing(audio)

    if audio_len > 5:
        print("Audio Duration More Than 5 Secs")
        return jsonify({'status': "Audio Duration More Than 5 Secs"})
    return jsonify({'status': "PreProcessing Done!"})

@app.route('/speaker-predict', methods=['POST'])
def speaker_predicting():
    """Classify the speaker of the most recently preprocessed clip.

    Runs the ONNX classifier on the module-level ``audio_speaker_input`` and
    maps the highest-scoring output index to a name in ``dataset_labels``.

    Returns
    -------
    flask.Response
        ``{'speaker': <label>}`` when the top score is at least 0.90,
        ``{'speaker': "Speaker Unidentified"}`` otherwise, or
        ``{'error': ...}`` with status 400 when /preprocessing has not yet
        produced an input array.
    """
    # The global starts as an empty-string placeholder; only an array is a valid input.
    if not isinstance(audio_speaker_input, np.ndarray):
        return jsonify({'error': "No preprocessed audio available; call /preprocessing first"}), 400

    print("Speaker Predicting...\n")
    inputDetails = model_onnx.get_inputs()
    start_time = time.time()
    pred_speaker = model_onnx.run(None, {inputDetails[0].name: audio_speaker_input})[0]
    print("--- %s seconds ---" % (time.time() - start_time))

    scores = pred_speaker[0]
    top_index = int(np.argmax(scores))
    if scores[top_index] < 0.90:
        print("Speaker Unidentified")
        return jsonify({'speaker': "Speaker Unidentified"})

    # The original read an undefined name `labels` (NameError on a fresh
    # kernel); `dataset_labels` is the label list this notebook defines.
    # NOTE(review): confirm its order matches the classifier's output indices.
    speaker = dataset_labels[top_index]
    print(speaker)
    return jsonify({'speaker': speaker})
    

@app.route('/word-predict', methods=['POST'])
def word_predicting():
    """Transcribe the most recently preprocessed clip with the Wav2Vec2 model.

    Reads the module-level ``audio`` waveform, runs the CTC model without
    gradients and decodes the logits with the language-model processor.

    Returns
    -------
    flask.Response
        ``{"transcribe": <text>}`` on success, or ``{'error': ...}`` with
        status 400 when no waveform is available (``/preprocessing`` has not
        run since the last transcription).
    """
    global audio
    # `audio` is an empty-string placeholder until /preprocessing loads a clip.
    if not isinstance(audio, np.ndarray):
        return jsonify({'error': "No audio available; call /preprocessing first"}), 400

    print("\n\nWords Predicting...\n")
    start_time = time.time()
    input_dict = processor(audio, sampling_rate=SAMPLE_RATE, return_tensors="pt", padding=True)
    with torch.no_grad():
        # Follow the device the model actually lives on instead of hard-coding "cuda".
        logits = model(input_dict.input_values.to(model.device)).logits
    transcriptionLM = processorLM.batch_decode(logits.cpu().detach().numpy()).text[0]
    print("--- %s seconds ---" % (time.time() - start_time))

    print(f"\n\nAudio Transcribe : {transcriptionLM}")
    # Reset the global to its placeholder rather than `del audio`: deleting the
    # module-level name made a repeated call fail with NameError.
    audio = ""
    del input_dict, logits
    gc.collect()
    torch.cuda.empty_cache()
    return jsonify({"transcribe" : transcriptionLM})


In [None]:
# Start the Socket.IO server when this cell/script runs as the main module.
# debug=True turns on Flask debug mode, use_reloader=False disables the
# auto-reloader, and allow_unsafe_werkzeug=True permits running on the
# Werkzeug development server. The call blocks until the server is stopped.
if __name__ == "__main__":
    socketio.run(app, debug=True, allow_unsafe_werkzeug=True, use_reloader=False)

Werkzeug appears to be used in a production deployment. Consider switching to a production web server instead.


 * Serving Flask app '__main__'
 * Debug mode: on


 * Running on http://127.0.0.1:5000
Press CTRL+C to quit
127.0.0.1 - - [19/Jun/2023 17:07:46] "GET / HTTP/1.1" 200 -
127.0.0.1 - - [19/Jun/2023 17:07:46] "GET /static/test.js HTTP/1.1" 200 -
127.0.0.1 - - [19/Jun/2023 17:07:46] "GET /static/style.css HTTP/1.1" 200 -
127.0.0.1 - - [19/Jun/2023 17:07:46] "GET /static/Lantai_2.jpg HTTP/1.1" 200 -
127.0.0.1 - - [19/Jun/2023 17:07:46] "GET /static/Lantai_1.jpg HTTP/1.1" 200 -
127.0.0.1 - - [19/Jun/2023 17:07:46] "GET /static/pic_bulboff.gif HTTP/1.1" 200 -


{'record': True}


ALSA lib pcm.c:2664:(snd_pcm_open_noupdate) Unknown PCM cards.pcm.rear
ALSA lib pcm.c:2664:(snd_pcm_open_noupdate) Unknown PCM cards.pcm.center_lfe
ALSA lib pcm.c:2664:(snd_pcm_open_noupdate) Unknown PCM cards.pcm.side
ALSA lib pcm_route.c:877:(find_matching_chmap) Found no matching channel map
ALSA lib pcm_route.c:877:(find_matching_chmap) Found no matching channel map
ALSA lib pcm_route.c:877:(find_matching_chmap) Found no matching channel map
ALSA lib pcm_route.c:877:(find_matching_chmap) Found no matching channel map
Expression 'alsa_snd_pcm_hw_params_set_buffer_size_near( pcm, hwParams, &alsaBufferFrames )' failed in 'src/hostapi/alsa/pa_linux_alsa.c', line: 923
Expression 'alsa_snd_pcm_hw_params_set_buffer_size_near( pcm, hwParams, &alsaBufferFrames )' failed in 'src/hostapi/alsa/pa_linux_alsa.c', line: 923
ALSA lib pcm_oss.c:397:(_snd_pcm_oss_open) Cannot open device /dev/dsp
ALSA lib pcm_oss.c:397:(_snd_pcm_oss_open) Cannot open device /dev/dsp
ALSA lib confmisc.c:160:(snd_conf

Listening...


127.0.0.1 - - [19/Jun/2023 17:08:20] "POST /listen HTTP/1.1" 200 -


/home/alckylzer/Desktop/LiveASR/microphone-results.wav


127.0.0.1 - - [19/Jun/2023 17:08:22] "POST /preprocessing HTTP/1.1" 200 -


Speaker Predicting...



127.0.0.1 - - [19/Jun/2023 17:08:23] "POST /speaker-predict HTTP/1.1" 200 -


--- 0.5367157459259033 seconds ---
Gesang


Words Predicting...

--- 0.7538247108459473 seconds ---


Audio Transcribe : jaksa kalau


127.0.0.1 - - [19/Jun/2023 17:08:24] "POST /word-predict HTTP/1.1" 200 -


{'record': True}


ALSA lib pcm.c:2664:(snd_pcm_open_noupdate) Unknown PCM cards.pcm.rear
ALSA lib pcm.c:2664:(snd_pcm_open_noupdate) Unknown PCM cards.pcm.center_lfe
ALSA lib pcm.c:2664:(snd_pcm_open_noupdate) Unknown PCM cards.pcm.side
ALSA lib pcm_route.c:877:(find_matching_chmap) Found no matching channel map
ALSA lib pcm_route.c:877:(find_matching_chmap) Found no matching channel map
ALSA lib pcm_route.c:877:(find_matching_chmap) Found no matching channel map
ALSA lib pcm_route.c:877:(find_matching_chmap) Found no matching channel map
Expression 'alsa_snd_pcm_hw_params_set_buffer_size_near( pcm, hwParams, &alsaBufferFrames )' failed in 'src/hostapi/alsa/pa_linux_alsa.c', line: 923
Expression 'alsa_snd_pcm_hw_params_set_buffer_size_near( pcm, hwParams, &alsaBufferFrames )' failed in 'src/hostapi/alsa/pa_linux_alsa.c', line: 923
ALSA lib pcm_oss.c:397:(_snd_pcm_oss_open) Cannot open device /dev/dsp
ALSA lib pcm_oss.c:397:(_snd_pcm_oss_open) Cannot open device /dev/dsp
ALSA lib confmisc.c:160:(snd_conf

Listening...


127.0.0.1 - - [19/Jun/2023 17:08:44] "POST /listen HTTP/1.1" 200 -


/home/alckylzer/Desktop/LiveASR/microphone-results.wav


127.0.0.1 - - [19/Jun/2023 17:08:45] "POST /preprocessing HTTP/1.1" 200 -
127.0.0.1 - - [19/Jun/2023 17:08:46] "POST /speaker-predict HTTP/1.1" 200 -


Speaker Predicting...

--- 0.016249418258666992 seconds ---
Gesang


Words Predicting...

--- 0.877577543258667 seconds ---


Audio Transcribe : saya jalan ini pesan telah ada seri sendiri ini kesan di


127.0.0.1 - - [19/Jun/2023 17:08:47] "POST /word-predict HTTP/1.1" 200 -
127.0.0.1 - - [19/Jun/2023 17:09:12] "GET / HTTP/1.1" 200 -
127.0.0.1 - - [19/Jun/2023 17:09:12] "GET /static/style.css HTTP/1.1" 304 -
127.0.0.1 - - [19/Jun/2023 17:09:12] "GET /static/test.js HTTP/1.1" 304 -
127.0.0.1 - - [19/Jun/2023 17:09:13] "GET /static/Lantai_1.jpg HTTP/1.1" 304 -
127.0.0.1 - - [19/Jun/2023 17:09:13] "GET /static/Lantai_2.jpg HTTP/1.1" 304 -
127.0.0.1 - - [19/Jun/2023 17:09:13] "GET /static/pic_bulboff.gif HTTP/1.1" 304 -


{'record': True}


ALSA lib pcm_dmix.c:1032:(snd_pcm_dmix_open) unable to open slave
ALSA lib pcm.c:2664:(snd_pcm_open_noupdate) Unknown PCM cards.pcm.rear
ALSA lib pcm.c:2664:(snd_pcm_open_noupdate) Unknown PCM cards.pcm.center_lfe
ALSA lib pcm.c:2664:(snd_pcm_open_noupdate) Unknown PCM cards.pcm.side
ALSA lib pcm_route.c:877:(find_matching_chmap) Found no matching channel map
Expression 'alsa_snd_pcm_hw_params_set_buffer_size_near( pcm, hwParams, &alsaBufferFrames )' failed in 'src/hostapi/alsa/pa_linux_alsa.c', line: 923
Expression 'alsa_snd_pcm_hw_params_set_buffer_size_near( pcm, hwParams, &alsaBufferFrames )' failed in 'src/hostapi/alsa/pa_linux_alsa.c', line: 923
ALSA lib pcm_oss.c:397:(_snd_pcm_oss_open) Cannot open device /dev/dsp
ALSA lib pcm_oss.c:397:(_snd_pcm_oss_open) Cannot open device /dev/dsp
ALSA lib confmisc.c:160:(snd_config_get_card) Invalid field card
ALSA lib pcm_usb_stream.c:482:(_snd_pcm_usb_stream_open) Invalid card 'card'
ALSA lib confmisc.c:160:(snd_config_get_card) Invalid fi

Listening...


127.0.0.1 - - [19/Jun/2023 17:09:41] "POST /listen HTTP/1.1" 200 -


/home/alckylzer/Desktop/LiveASR/microphone-results.wav


127.0.0.1 - - [19/Jun/2023 17:09:41] "POST /preprocessing HTTP/1.1" 200 -
127.0.0.1 - - [19/Jun/2023 17:09:41] "POST /speaker-predict HTTP/1.1" 200 -


Speaker Predicting...

--- 0.017792940139770508 seconds ---
Gesang


Words Predicting...

--- 0.47724199295043945 seconds ---


Audio Transcribe : satu nol satu


127.0.0.1 - - [19/Jun/2023 17:09:42] "POST /word-predict HTTP/1.1" 200 -


{'record': True}


ALSA lib pcm.c:2664:(snd_pcm_open_noupdate) Unknown PCM cards.pcm.rear
ALSA lib pcm.c:2664:(snd_pcm_open_noupdate) Unknown PCM cards.pcm.center_lfe
ALSA lib pcm.c:2664:(snd_pcm_open_noupdate) Unknown PCM cards.pcm.side
ALSA lib pcm_route.c:877:(find_matching_chmap) Found no matching channel map
ALSA lib pcm_route.c:877:(find_matching_chmap) Found no matching channel map
ALSA lib pcm_route.c:877:(find_matching_chmap) Found no matching channel map
ALSA lib pcm_route.c:877:(find_matching_chmap) Found no matching channel map
Expression 'alsa_snd_pcm_hw_params_set_buffer_size_near( pcm, hwParams, &alsaBufferFrames )' failed in 'src/hostapi/alsa/pa_linux_alsa.c', line: 923
Expression 'alsa_snd_pcm_hw_params_set_buffer_size_near( pcm, hwParams, &alsaBufferFrames )' failed in 'src/hostapi/alsa/pa_linux_alsa.c', line: 923
ALSA lib pcm_oss.c:397:(_snd_pcm_oss_open) Cannot open device /dev/dsp
ALSA lib pcm_oss.c:397:(_snd_pcm_oss_open) Cannot open device /dev/dsp
ALSA lib confmisc.c:160:(snd_conf

Listening...


127.0.0.1 - - [19/Jun/2023 17:10:12] "POST /listen HTTP/1.1" 200 -


/home/alckylzer/Desktop/LiveASR/microphone-results.wav


127.0.0.1 - - [19/Jun/2023 17:10:13] "POST /preprocessing HTTP/1.1" 200 -


Audio Duration More Than 5 Secs
{'record': True}


ALSA lib pcm.c:2664:(snd_pcm_open_noupdate) Unknown PCM cards.pcm.rear
ALSA lib pcm.c:2664:(snd_pcm_open_noupdate) Unknown PCM cards.pcm.center_lfe
ALSA lib pcm.c:2664:(snd_pcm_open_noupdate) Unknown PCM cards.pcm.side
ALSA lib pcm_route.c:877:(find_matching_chmap) Found no matching channel map
ALSA lib pcm_route.c:877:(find_matching_chmap) Found no matching channel map
ALSA lib pcm_route.c:877:(find_matching_chmap) Found no matching channel map
ALSA lib pcm_route.c:877:(find_matching_chmap) Found no matching channel map
Expression 'alsa_snd_pcm_hw_params_set_buffer_size_near( pcm, hwParams, &alsaBufferFrames )' failed in 'src/hostapi/alsa/pa_linux_alsa.c', line: 923
Expression 'alsa_snd_pcm_hw_params_set_buffer_size_near( pcm, hwParams, &alsaBufferFrames )' failed in 'src/hostapi/alsa/pa_linux_alsa.c', line: 923
ALSA lib pcm_oss.c:397:(_snd_pcm_oss_open) Cannot open device /dev/dsp
ALSA lib pcm_oss.c:397:(_snd_pcm_oss_open) Cannot open device /dev/dsp
ALSA lib confmisc.c:160:(snd_conf

Listening...


127.0.0.1 - - [19/Jun/2023 17:11:42] "POST /listen HTTP/1.1" 200 -


/home/alckylzer/Desktop/LiveASR/microphone-results.wav


127.0.0.1 - - [19/Jun/2023 17:11:43] "POST /preprocessing HTTP/1.1" 200 -
127.0.0.1 - - [19/Jun/2023 17:11:43] "POST /speaker-predict HTTP/1.1" 200 -


Speaker Predicting...

--- 0.01746082305908203 seconds ---
Raja


Words Predicting...

--- 0.5966818332672119 seconds ---


Audio Transcribe : nyalakan lampu dua nol satu


127.0.0.1 - - [19/Jun/2023 17:11:44] "POST /word-predict HTTP/1.1" 200 -
127.0.0.1 - - [19/Jun/2023 17:11:44] "GET /static/pic_bulbon.gif HTTP/1.1" 200 -


{'record': True}


ALSA lib pcm.c:2664:(snd_pcm_open_noupdate) Unknown PCM cards.pcm.rear
ALSA lib pcm.c:2664:(snd_pcm_open_noupdate) Unknown PCM cards.pcm.center_lfe
ALSA lib pcm.c:2664:(snd_pcm_open_noupdate) Unknown PCM cards.pcm.side
ALSA lib pcm_route.c:877:(find_matching_chmap) Found no matching channel map
ALSA lib pcm_route.c:877:(find_matching_chmap) Found no matching channel map
ALSA lib pcm_route.c:877:(find_matching_chmap) Found no matching channel map
ALSA lib pcm_route.c:877:(find_matching_chmap) Found no matching channel map
Expression 'alsa_snd_pcm_hw_params_set_buffer_size_near( pcm, hwParams, &alsaBufferFrames )' failed in 'src/hostapi/alsa/pa_linux_alsa.c', line: 923
Expression 'alsa_snd_pcm_hw_params_set_buffer_size_near( pcm, hwParams, &alsaBufferFrames )' failed in 'src/hostapi/alsa/pa_linux_alsa.c', line: 923
ALSA lib pcm_oss.c:397:(_snd_pcm_oss_open) Cannot open device /dev/dsp
ALSA lib pcm_oss.c:397:(_snd_pcm_oss_open) Cannot open device /dev/dsp
ALSA lib confmisc.c:160:(snd_conf

Listening...


127.0.0.1 - - [19/Jun/2023 17:12:32] "POST /listen HTTP/1.1" 200 -


/home/alckylzer/Desktop/LiveASR/microphone-results.wav


127.0.0.1 - - [19/Jun/2023 17:12:33] "POST /preprocessing HTTP/1.1" 200 -


Audio Duration More Than 5 Secs
{'record': True}


ALSA lib pcm.c:2664:(snd_pcm_open_noupdate) Unknown PCM cards.pcm.rear
ALSA lib pcm.c:2664:(snd_pcm_open_noupdate) Unknown PCM cards.pcm.center_lfe
ALSA lib pcm.c:2664:(snd_pcm_open_noupdate) Unknown PCM cards.pcm.side
ALSA lib pcm_route.c:877:(find_matching_chmap) Found no matching channel map
ALSA lib pcm_route.c:877:(find_matching_chmap) Found no matching channel map
ALSA lib pcm_route.c:877:(find_matching_chmap) Found no matching channel map
ALSA lib pcm_route.c:877:(find_matching_chmap) Found no matching channel map
Expression 'alsa_snd_pcm_hw_params_set_buffer_size_near( pcm, hwParams, &alsaBufferFrames )' failed in 'src/hostapi/alsa/pa_linux_alsa.c', line: 923
Expression 'alsa_snd_pcm_hw_params_set_buffer_size_near( pcm, hwParams, &alsaBufferFrames )' failed in 'src/hostapi/alsa/pa_linux_alsa.c', line: 923
ALSA lib pcm_oss.c:397:(_snd_pcm_oss_open) Cannot open device /dev/dsp
ALSA lib pcm_oss.c:397:(_snd_pcm_oss_open) Cannot open device /dev/dsp
ALSA lib confmisc.c:160:(snd_conf

Listening...


127.0.0.1 - - [19/Jun/2023 17:12:48] "POST /listen HTTP/1.1" 200 -


/home/alckylzer/Desktop/LiveASR/microphone-results.wav


127.0.0.1 - - [19/Jun/2023 17:12:49] "POST /preprocessing HTTP/1.1" 200 -
127.0.0.1 - - [19/Jun/2023 17:12:49] "POST /speaker-predict HTTP/1.1" 200 -


Speaker Predicting...

--- 0.01985454559326172 seconds ---
Raja


Words Predicting...

--- 0.5751993656158447 seconds ---


Audio Transcribe : menyalakan lampu satu nol satu


127.0.0.1 - - [19/Jun/2023 17:12:50] "POST /word-predict HTTP/1.1" 200 -


{'record': True}


ALSA lib pcm.c:2664:(snd_pcm_open_noupdate) Unknown PCM cards.pcm.rear
ALSA lib pcm.c:2664:(snd_pcm_open_noupdate) Unknown PCM cards.pcm.center_lfe
ALSA lib pcm.c:2664:(snd_pcm_open_noupdate) Unknown PCM cards.pcm.side
ALSA lib pcm_route.c:877:(find_matching_chmap) Found no matching channel map
ALSA lib pcm_route.c:877:(find_matching_chmap) Found no matching channel map
ALSA lib pcm_route.c:877:(find_matching_chmap) Found no matching channel map
ALSA lib pcm_route.c:877:(find_matching_chmap) Found no matching channel map
Expression 'alsa_snd_pcm_hw_params_set_buffer_size_near( pcm, hwParams, &alsaBufferFrames )' failed in 'src/hostapi/alsa/pa_linux_alsa.c', line: 923
Expression 'alsa_snd_pcm_hw_params_set_buffer_size_near( pcm, hwParams, &alsaBufferFrames )' failed in 'src/hostapi/alsa/pa_linux_alsa.c', line: 923
ALSA lib pcm_oss.c:397:(_snd_pcm_oss_open) Cannot open device /dev/dsp
ALSA lib pcm_oss.c:397:(_snd_pcm_oss_open) Cannot open device /dev/dsp
ALSA lib confmisc.c:160:(snd_conf

Listening...


127.0.0.1 - - [19/Jun/2023 17:13:20] "POST /listen HTTP/1.1" 200 -


/home/alckylzer/Desktop/LiveASR/microphone-results.wav


127.0.0.1 - - [19/Jun/2023 17:13:21] "POST /preprocessing HTTP/1.1" 200 -
127.0.0.1 - - [19/Jun/2023 17:13:21] "POST /speaker-predict HTTP/1.1" 200 -


Speaker Predicting...

--- 0.016396284103393555 seconds ---
Gesang


Words Predicting...

--- 0.6168172359466553 seconds ---


Audio Transcribe : matikan lampu satu nol satu


127.0.0.1 - - [19/Jun/2023 17:13:22] "POST /word-predict HTTP/1.1" 200 -


{'record': True}


ALSA lib pcm.c:2664:(snd_pcm_open_noupdate) Unknown PCM cards.pcm.rear
ALSA lib pcm.c:2664:(snd_pcm_open_noupdate) Unknown PCM cards.pcm.center_lfe
ALSA lib pcm.c:2664:(snd_pcm_open_noupdate) Unknown PCM cards.pcm.side
ALSA lib pcm_route.c:877:(find_matching_chmap) Found no matching channel map
ALSA lib pcm_route.c:877:(find_matching_chmap) Found no matching channel map
ALSA lib pcm_route.c:877:(find_matching_chmap) Found no matching channel map
ALSA lib pcm_route.c:877:(find_matching_chmap) Found no matching channel map
Expression 'alsa_snd_pcm_hw_params_set_buffer_size_near( pcm, hwParams, &alsaBufferFrames )' failed in 'src/hostapi/alsa/pa_linux_alsa.c', line: 923
Expression 'alsa_snd_pcm_hw_params_set_buffer_size_near( pcm, hwParams, &alsaBufferFrames )' failed in 'src/hostapi/alsa/pa_linux_alsa.c', line: 923
ALSA lib pcm_oss.c:397:(_snd_pcm_oss_open) Cannot open device /dev/dsp
ALSA lib pcm_oss.c:397:(_snd_pcm_oss_open) Cannot open device /dev/dsp
ALSA lib confmisc.c:160:(snd_conf

Listening...
