A convenient Dockerized solution that transcribes media into subtitles using various Whisper implementations.
# Build the image from the Dockerfile in the current directory and tag it "asr".
docker build -t asr .
# Start an interactive bash shell in a throwaway container (--rm) with all GPUs
# exposed and the current directory bind-mounted at /tmp1.
# The command substitution is quoted so that a working directory containing
# spaces or glob characters is still passed to -v as a single argument.
docker run --rm -it --gpus=all -v "$(pwd):/tmp1" asr /bin/bash
# Alternative (disabled): expose only GPU devices 0 and 1, mount the current
# directory at /app, and run the image's default command.
#docker run -it --rm --gpus '"device=0,1"' -v "$(pwd):/app" asr
# Example transcription commands. All of them read /tmp1/lesson1.mp4, i.e. a
# file under the /tmp1 path that the `docker run` bind mount targets, so they
# are presumably meant to be typed inside the container shell.

# whisper-faster: English, SRT output written to /tmp1/, models read from /models/.
whisper-faster /tmp1/lesson1.mp4 \
  --model_dir=/models/ \
  --model="large-v2" \
  --language=en \
  --output_dir=/tmp1/ \
  --output_format=srt \
  --vad_min_silence_duration_ms=1000 \
  --temperature=1

# whisper-ctranslate2: English, SRT output, VAD filter enabled, CUDA device
# with float16 compute, model loaded from /models/faster-whisper-large-v2/.
whisper-ctranslate2 /tmp1/lesson1.mp4 \
  --model_directory /models/faster-whisper-large-v2/ \
  --vad_filter True \
  --vad_min_silence_duration_ms 1000 \
  --beam_size 5 \
  --print_colors True \
  --output_format srt \
  --device cuda \
  --compute_type float16 \
  --language en

# simple.py: explicit input (-i) and output (-o) paths.
python3 simple.py \
  -i /tmp1/lesson1.mp4 \
  -o /tmp1/lesson1.srt

# app.py with a local media file as input.
python3 app.py \
  -i /tmp1/lesson1.mp4

# app.py with a YouTube URL as input.
# NOTE(review): `-l fr` presumably selects French as the language — confirm against app.py.
python3 app.py \
  -i https://youtu.be/XZEkIK4_d-o \
  -l fr