# Speech Digit Dataset

This notebook shows you how to prepare a synthetic dataset of speech data for digits 0-9.

This project is motivated by the desire to create a dataset similar to MNIST but for speech data.

## Installation

Python==3.10
piper-tts==1.2.0



In [8]:

voices = {
    "amy": {
        "model": "https://huggingface.co/rhasspy/piper-voices/resolve/v1.0.0/en/en_US/amy/medium/en_US-amy-medium.onnx?download=true",
        "config": "https://huggingface.co/rhasspy/piper-voices/resolve/v1.0.0/en/en_US/amy/medium/en_US-amy-medium.onnx.json?download=true.json"
    },
    "arctic": {
        "model": "https://huggingface.co/rhasspy/piper-voices/resolve/v1.0.0/en/en_US/arctic/medium/en_US-arctic-medium.onnx?download=true",
        "config": "https://huggingface.co/rhasspy/piper-voices/resolve/v1.0.0/en/en_US/arctic/medium/en_US-arctic-medium.onnx.json?download=true.json"
    },
    "bryce": {
        "model": "https://huggingface.co/rhasspy/piper-voices/resolve/v1.0.0/en/en_US/bryce/medium/en_US-bryce-medium.onnx?download=true",
        "config": "https://huggingface.co/rhasspy/piper-voices/resolve/v1.0.0/en/en_US/bryce/medium/en_US-bryce-medium.onnx.json?download=true.json"
    },
    "danny": {
        "model": "https://huggingface.co/rhasspy/piper-voices/resolve/v1.0.0/en/en_US/danny/low/en_US-danny-low.onnx?download=true",
        "config": "https://huggingface.co/rhasspy/piper-voices/resolve/v1.0.0/en/en_US/danny/low/en_US-danny-low.onnx.json?download=true.json"
    },
    "hfc_female": {
        "model": "https://huggingface.co/rhasspy/piper-voices/resolve/v1.0.0/en/en_US/hfc_female/medium/en_US-hfc_female-medium.onnx?download=true",
        "config": "https://huggingface.co/rhasspy/piper-voices/resolve/v1.0.0/en/en_US/hfc_female/medium/en_US-hfc_female-medium.onnx.json?download=true.json"
    },
    "hfc_male": {
        "model": "https://huggingface.co/rhasspy/piper-voices/resolve/v1.0.0/en/en_US/hfc_male/medium/en_US-hfc_male-medium.onnx?download=true",
        "config": "https://huggingface.co/rhasspy/piper-voices/resolve/v1.0.0/en/en_US/hfc_male/medium/en_US-hfc_male-medium.onnx.json?download=true.json"
    },
    "joe": {
        "model": "https://huggingface.co/rhasspy/piper-voices/resolve/v1.0.0/en/en_US/joe/medium/en_US-joe-medium.onnx?download=true",
        "config": "https://huggingface.co/rhasspy/piper-voices/resolve/v1.0.0/en/en_US/joe/medium/en_US-joe-medium.onnx.json?download=true.json"
    },
    "john": {
        "model": "https://huggingface.co/rhasspy/piper-voices/resolve/v1.0.0/en/en_US/john/medium/en_US-john-medium.onnx?download=true",
        "config": "https://huggingface.co/rhasspy/piper-voices/resolve/v1.0.0/en/en_US/john/medium/en_US-john-medium.onnx.json?download=true.json"
    },
    "kathleen": {
        "model": "https://huggingface.co/rhasspy/piper-voices/resolve/v1.0.0/en/en_US/kathleen/low/en_US-kathleen-low.onnx?download=true",
        "config": "https://huggingface.co/rhasspy/piper-voices/resolve/v1.0.0/en/en_US/kathleen/low/en_US-kathleen-low.onnx.json?download=true.json"
    },
    "kristin": {
        "model": "https://huggingface.co/rhasspy/piper-voices/resolve/v1.0.0/en/en_US/kristin/medium/en_US-kristin-medium.onnx?download=true",
        "config": "https://huggingface.co/rhasspy/piper-voices/resolve/v1.0.0/en/en_US/kristin/medium/en_US-kristin-medium.onnx.json?download=true.json"
    },
    "kusal": {
        "model": "https://huggingface.co/rhasspy/piper-voices/resolve/v1.0.0/en/en_US/kusal/medium/en_US-kusal-medium.onnx?download=true",
        "config": "https://huggingface.co/rhasspy/piper-voices/resolve/v1.0.0/en/en_US/kusal/medium/en_US-kusal-medium.onnx.json?download=true.json"
    },
    "l2arctic": {
        "model": "https://huggingface.co/rhasspy/piper-voices/resolve/v1.0.0/en/en_US/l2arctic/medium/en_US-l2arctic-medium.onnx?download=true",
        "config": "https://huggingface.co/rhasspy/piper-voices/resolve/v1.0.0/en/en_US/l2arctic/medium/en_US-l2arctic-medium.onnx.json?download=true.json"
    },
    "lessac": {
        "model": "https://huggingface.co/rhasspy/piper-voices/resolve/v1.0.0/en/en_US/lessac/medium/en_US-lessac-medium.onnx?download=true",
        "config": "https://huggingface.co/rhasspy/piper-voices/resolve/v1.0.0/en/en_US/lessac/medium/en_US-lessac-medium.onnx.json?download=true.json"
    },
    "libritts": {
        "model": "https://huggingface.co/rhasspy/piper-voices/resolve/v1.0.0/en/en_US/libritts/high/en_US-libritts-high.onnx?download=true",
        "config": "https://huggingface.co/rhasspy/piper-voices/resolve/v1.0.0/en/en_US/libritts/high/en_US-libritts-high.onnx.json?download=true.json"
    },
    "libritts_r": {
        "model": "https://huggingface.co/rhasspy/piper-voices/resolve/v1.0.0/en/en_US/libritts_r/medium/en_US-libritts_r-medium.onnx?download=true",
        "config": "https://huggingface.co/rhasspy/piper-voices/resolve/v1.0.0/en/en_US/libritts_r/medium/en_US-libritts_r-medium.onnx.json?download=true.json"
    },
    "ljspeech": {
        "model": "https://huggingface.co/rhasspy/piper-voices/resolve/v1.0.0/en/en_US/ljspeech/medium/en_US-ljspeech-medium.onnx?download=true",
        "config": "https://huggingface.co/rhasspy/piper-voices/resolve/v1.0.0/en/en_US/ljspeech/medium/en_US-ljspeech-medium.onnx.json?download=true.json"
    },
    "norman": {
        "model": "https://huggingface.co/rhasspy/piper-voices/resolve/v1.0.0/en/en_US/norman/medium/en_US-norman-medium.onnx?download=true",
        "config": "https://huggingface.co/rhasspy/piper-voices/resolve/v1.0.0/en/en_US/norman/medium/en_US-norman-medium.onnx.json?download=true.json"
    },
    "ryan": {
        "model": "https://huggingface.co/rhasspy/piper-voices/resolve/v1.0.0/en/en_US/ryan/medium/en_US-ryan-medium.onnx?download=true",
        "config": "https://huggingface.co/rhasspy/piper-voices/resolve/v1.0.0/en/en_US/ryan/medium/en_US-ryan-medium.onnx.json?download=true.json"
    }
}


import os
import subprocess

for voice, urls in voices.items():
    # Create directory for the voice
    voice_dir = os.path.join('voices', voice)
    os.makedirs(voice_dir, exist_ok=True)
    print(voice_dir)
    
    
    # Download model file
    model_url = urls['model']
    model_filename = os.path.join(voice_dir, f'{voice}_model.onnx')
    subprocess.run(['wget', '-O', model_filename, model_url], check=True)
    
    # Download config file
    config_url = urls['config']
    config_filename = os.path.join(voice_dir, f'{voice}_config.json')
    subprocess.run(['wget', '-O', config_filename, config_url], check=True)
    
    print(f"Downloaded files for {voice}")
    

voices/amy


--2024-10-16 19:23:32--  https://huggingface.co/rhasspy/piper-voices/resolve/v1.0.0/en/en_US/amy/medium/en_US-amy-medium.onnx?download=true
Resolving huggingface.co (huggingface.co)... 2600:9000:261f:8a00:17:b174:6d00:93a1, 2600:9000:261f:b800:17:b174:6d00:93a1, 2600:9000:261f:fc00:17:b174:6d00:93a1, ...
Connecting to huggingface.co (huggingface.co)|2600:9000:261f:8a00:17:b174:6d00:93a1|:443... connected.
HTTP request sent, awaiting response... 302 Found
Location: https://cdn-lfs.hf.co/repos/ed/06/ed062eb100d7bd80d78f61252cd190fca48cbda97eb1753fb827ff3339a6b11c/b3a6e47b57b8c7fbe6a0ce2518161a50f59a9cdd8a50835c02cb02bdd6206c18?response-content-disposition=attachment%3B+filename*%3DUTF-8%27%27en_US-amy-medium.onnx%3B+filename%3D%22en_US-amy-medium.onnx%22%3B&Expires=1729365812&Policy=eyJTdGF0ZW1lbnQiOlt7IkNvbmRpdGlvbiI6eyJEYXRlTGVzc1RoYW4iOnsiQVdTOkVwb2NoVGltZSI6MTcyOTM2NTgxMn19LCJSZXNvdXJjZSI6Imh0dHBzOi8vY2RuLWxmcy5oZi5jby9yZXBvcy9lZC8wNi9lZDA2MmViMTAwZDdiZDgwZDc4ZjYxMjUyY2QxOTBmY2E0OGNi

Downloaded files for amy
voices/arctic


connected.
HTTP request sent, awaiting response... 302 Found
Location: https://cdn-lfs.hf.co/repos/ed/06/ed062eb100d7bd80d78f61252cd190fca48cbda97eb1753fb827ff3339a6b11c/483303e294947a3ec2f910ea96093d876e1640f5772e9d89e511d6c82c667286?response-content-disposition=attachment%3B+filename*%3DUTF-8%27%27en_US-arctic-medium.onnx%3B+filename%3D%22en_US-arctic-medium.onnx%22%3B&Expires=1729365813&Policy=eyJTdGF0ZW1lbnQiOlt7IkNvbmRpdGlvbiI6eyJEYXRlTGVzc1RoYW4iOnsiQVdTOkVwb2NoVGltZSI6MTcyOTM2NTgxM319LCJSZXNvdXJjZSI6Imh0dHBzOi8vY2RuLWxmcy5oZi5jby9yZXBvcy9lZC8wNi9lZDA2MmViMTAwZDdiZDgwZDc4ZjYxMjUyY2QxOTBmY2E0OGNiZGE5N2ViMTc1M2ZiODI3ZmYzMzM5YTZiMTFjLzQ4MzMwM2UyOTQ5NDdhM2VjMmY5MTBlYTk2MDkzZDg3NmUxNjQwZjU3NzJlOWQ4OWU1MTFkNmM4MmM2NjcyODY%7EcmVzcG9uc2UtY29udGVudC1kaXNwb3NpdGlvbj0qIn1dfQ__&Signature=pfaOcZxJUx3NpLln0Tu9mZL43rGpHZtLKFETVujvZbpieoUAgBFRjuXdQkf39ca14Qqya1S3Kgpk93i0nfcEI3eUjY5Mg3MROEvo7QRknuZJ1lBHDxF%7EbGWV5od7LLnG7H11ITcf%7E5SMa4UP-fxUZB7XxjGUlV-Ldw1nBiyIjg%7E4upXygeOXggGwnDJ03bQ-o8u8yC1bX

Downloaded files for arctic
voices/bryce


. ..........  2%  104M 1s
  1400K .......... .......... .......... .......... ..........  2%  135M 1s
  1450K .......... .......... .......... .......... ..........  2% 95.1M 1s
  1500K .......... .......... .......... .......... ..........  2%  127M 1s
  1550K .......... .......... .......... .......... ..........  2%  127M 1s
  1600K .......... .......... .......... .......... ..........  2% 86.5M 1s
  1650K .......... .......... .......... .......... ..........  2% 94.4M 1s
  1700K .......... .......... .......... .......... ..........  2%  132M 1s
  1750K .......... .......... .......... .......... ..........  2%  128M 1s
  1800K .......... .......... .......... .......... ..........  2%  112M 1s
  1850K .......... .......... .......... .......... ..........  3%  119M 1s
  1900K .......... .......... .......... .......... ..........  3%  104M 1s
  1950K .......... .......... .......... .......... ..........  3%  112M 1s
  2000K .......... .......... .......... .......... ..........

Downloaded files for bryce
voices/danny


200 OK
Length: 63104526 (60M) [application/octet-stream]
Saving to: ‘voices/danny/danny_model.onnx’

     0K .......... .......... .......... .......... ..........  0% 20.4M 3s
    50K .......... .......... .......... .......... ..........  0% 24.0M 3s
   100K .......... .......... .......... .......... ..........  0% 68.6M 2s
   150K .......... .......... .......... .......... ..........  0% 67.4M 2s
   200K .......... .......... .......... .......... ..........  0% 39.2M 2s
   250K .......... .......... .......... .......... ..........  0% 79.4M 2s
   300K .......... .......... .......... .......... ..........  0% 77.0M 1s
   350K .......... .......... .......... .......... ..........  0% 77.4M 1s
   400K .......... .......... .......... .......... ..........  0%  127M 1s
   450K .......... .......... .......... .......... ..........  0% 77.9M 1s
   500K .......... .......... .......... .......... ..........  0% 99.6M 1s
   550K .......... .......... .......... .......... .......... 

Downloaded files for danny
voices/hfc_female


. .......... ..........  7%  127M 1s
  4750K .......... .......... .......... .......... ..........  7%  105M 1s
  4800K .......... .......... .......... .......... ..........  7% 97.2M 1s
  4850K .......... .......... .......... .......... ..........  7%  128M 1s
  4900K .......... .......... .......... .......... ..........  8% 86.6M 1s
  4950K .......... .......... .......... .......... ..........  8% 91.2M 1s
  5000K .......... .......... .......... .......... ..........  8%  127M 1s
  5050K .......... .......... .......... .......... ..........  8%  129M 1s
  5100K .......... .......... .......... .......... ..........  8% 86.6M 1s
  5150K .......... .......... .......... .......... ..........  8%  103M 1s
  5200K .......... .......... .......... .......... ..........  8% 95.1M 1s
  5250K .......... .......... .......... .......... ..........  8% 87.8M 1s
  5300K .......... .......... .......... .......... ..........  8% 80.5M 1s
  5350K .......... .......... .......... ..........

Downloaded files for hfc_female
voices/hfc_male


Resolving huggingface.co (huggingface.co)... 2600:9000:261f:9a00:17:b174:6d00:93a1, 2600:9000:261f:7600:17:b174:6d00:93a1, 2600:9000:261f:e000:17:b174:6d00:93a1, ...
Connecting to huggingface.co (huggingface.co)|2600:9000:261f:9a00:17:b174:6d00:93a1|:443... connected.
HTTP request sent, awaiting response... 302 Found
Location: https://cdn-lfs.hf.co/repos/ed/06/ed062eb100d7bd80d78f61252cd190fca48cbda97eb1753fb827ff3339a6b11c/d11e403a02bdf5a670c877b3dc56e0e1c8cece6fb30289586314dffdc0a78cb0?response-content-disposition=attachment%3B+filename*%3DUTF-8%27%27en_US-hfc_male-medium.onnx%3B+filename%3D%22en_US-hfc_male-medium.onnx%22%3B&Expires=1729365817&Policy=eyJTdGF0ZW1lbnQiOlt7IkNvbmRpdGlvbiI6eyJEYXRlTGVzc1RoYW4iOnsiQVdTOkVwb2NoVGltZSI6MTcyOTM2NTgxN319LCJSZXNvdXJjZSI6Imh0dHBzOi8vY2RuLWxmcy5oZi5jby9yZXBvcy9lZC8wNi9lZDA2MmViMTAwZDdiZDgwZDc4ZjYxMjUyY2QxOTBmY2E0OGNiZGE5N2ViMTc1M2ZiODI3ZmYzMzM5YTZiMTFjL2QxMWU0MDNhMDJiZGY1YTY3MGM4NzdiM2RjNTZlMGUxYzhjZWNlNmZiMzAyODk1ODYzMTRkZmZkYzBhNzhjYjA%7EcmVz

Downloaded files for hfc_male
voices/joe


3.171.139.118, 3.171.139.62, 3.171.139.14, ...
Connecting to cdn-lfs.hf.co (cdn-lfs.hf.co)|3.171.139.118|:443... connected.
HTTP request sent, awaiting response... 200 OK
Length: 63201294 (60M) [application/octet-stream]
Saving to: ‘voices/joe/joe_model.onnx’

     0K .......... .......... .......... .......... ..........  0% 18.5M 3s
    50K .......... .......... .......... .......... ..........  0% 25.1M 3s
   100K .......... .......... .......... .......... ..........  0% 5.16M 6s
   150K .......... .......... .......... .......... ..........  0% 46.7M 5s
   200K .......... .......... .......... .......... ..........  0% 29.1M 4s
   250K .......... .......... .......... .......... ..........  0% 84.5M 4s
   300K .......... .......... .......... .......... ..........  0% 57.0M 3s
   350K .......... .......... .......... .......... ..........  0% 35.8M 3s
   400K .......... .......... .......... .......... ..........  0% 86.4M 3s
   450K .......... .......... .......... .......... ...

Downloaded files for joe
voices/john


200 OK
Length: 63531379 (61M) [application/octet-stream]
Saving to: ‘voices/john/john_model.onnx’

     0K .......... .......... .......... .......... ..........  0% 20.7M 3s
    50K .......... .......... .......... .......... ..........  0% 22.1M 3s
   100K .......... .......... .......... .......... ..........  0% 43.3M 2s
   150K .......... .......... .......... .......... ..........  0%  116M 2s
   200K .......... .......... .......... .......... ..........  0% 41.8M 2s
   250K .......... .......... .......... .......... ..........  0% 94.2M 2s
   300K .......... .......... .......... .......... ..........  0% 64.4M 2s
   350K .......... .......... .......... .......... ..........  0%  103M 1s
   400K .......... .......... .......... .......... ..........  0%  117M 1s
   450K .......... .......... .......... .......... ..........  0%  112M 1s
   500K .......... .......... .......... .......... ..........  0% 94.0M 1s
   550K .......... .......... .......... .......... ..........  0

Downloaded files for john
voices/kathleen


200 OK
Length: 63104526 (60M) [application/octet-stream]
Saving to: ‘voices/kathleen/kathleen_model.onnx’

     0K .......... .......... .......... .......... ..........  0% 18.1M 3s
    50K .......... .......... .......... .......... ..........  0% 23.3M 3s
   100K .......... .......... .......... .......... ..........  0% 18.5M 3s
   150K .......... .......... .......... .......... ..........  0% 90.5M 2s
   200K .......... .......... .......... .......... ..........  0% 65.8M 2s
   250K .......... .......... .......... .......... ..........  0% 35.7M 2s
   300K .......... .......... .......... .......... ..........  0%  123M 2s
   350K .......... .......... .......... .......... ..........  0% 99.3M 2s
   400K .......... .......... .......... .......... ..........  0% 78.9M 2s
   450K .......... .......... .......... .......... ..........  0% 95.1M 1s
   500K .......... .......... .......... .......... ..........  0% 84.5M 1s
   550K .......... .......... .......... .......... .....

Downloaded files for kathleen
voices/kristin


... ..........  8%  100M 1s
  5450K .......... .......... .......... .......... ..........  8%  109M 1s
  5500K .......... .......... .......... .......... ..........  8% 97.9M 1s
  5550K .......... .......... .......... .......... ..........  9%  130M 1s
  5600K .......... .......... .......... .......... ..........  9% 91.0M 1s
  5650K .......... .......... .......... .......... ..........  9%  129M 1s
  5700K .......... .......... .......... .......... ..........  9%  118M 1s
  5750K .......... .......... .......... .......... ..........  9%  108M 1s
  5800K .......... .......... .......... .......... ..........  9% 99.3M 1s
  5850K .......... .......... .......... .......... ..........  9%  130M 1s
  5900K .......... .......... .......... .......... ..........  9% 91.8M 1s
  5950K .......... .......... .......... .......... ..........  9% 86.3M 1s
  6000K .......... .......... .......... .......... ..........  9%  130M 1s
  6050K .......... .......... .......... .......... ........

Downloaded files for kristin
voices/kusal


...  0% 16.1M 4s
    50K .......... .......... .......... .......... ..........  0% 15.3M 4s
   100K .......... .......... .......... .......... ..........  0% 78.6M 3s
   150K .......... .......... .......... .......... ..........  0% 35.1M 3s
   200K .......... .......... .......... .......... ..........  0% 30.7M 2s
   250K .......... .......... .......... .......... ..........  0% 71.0M 2s
   300K .......... .......... .......... .......... ..........  0% 76.0M 2s
   350K .......... .......... .......... .......... ..........  0% 67.7M 2s
   400K .......... .......... .......... .......... ..........  0% 76.4M 2s
   450K .......... .......... .......... .......... ..........  0% 86.1M 2s
   500K .......... .......... .......... .......... ..........  0% 86.4M 2s
   550K .......... .......... .......... .......... ..........  0% 94.7M 1s
   600K .......... .......... .......... .......... ..........  1%  119M 1s
   650K .......... .......... .......... .......... ..........  1%  102

Downloaded files for kusal
voices/l2arctic


..... .......... .......... ..........  9% 99.7M 1s
  7050K .......... .......... .......... .......... ..........  9% 96.9M 1s
  7100K .......... .......... .......... .......... ..........  9%  103M 1s
  7150K .......... .......... .......... .......... ..........  9%  104M 1s
  7200K .......... .......... .......... .......... ..........  9%  118M 1s
  7250K .......... .......... .......... .......... ..........  9%  111M 1s
  7300K .......... .......... .......... .......... ..........  9% 74.6M 1s
  7350K .......... .......... .......... .......... ..........  9%  128M 1s
  7400K .......... .......... .......... .......... ..........  9%  109M 1s
  7450K .......... .......... .......... .......... .......... 10% 98.3M 1s
  7500K .......... .......... .......... .......... .......... 10%  129M 1s
  7550K .......... .......... .......... .......... .......... 10%  108M 1s
  7600K .......... .......... .......... .......... .......... 10% 93.1M 1s
  7650K .......... .......... ......

Downloaded files for l2arctic
voices/lessac


connected.
HTTP request sent, awaiting response... 200 OK
Length: 63201294 (60M) [application/octet-stream]
Saving to: ‘voices/lessac/lessac_model.onnx’

     0K .......... .......... .......... .......... ..........  0% 20.7M 3s
    50K .......... .......... .......... .......... ..........  0% 16.7M 3s
   100K .......... .......... .......... .......... ..........  0% 86.4M 2s
   150K .......... .......... .......... .......... ..........  0% 30.1M 2s
   200K .......... .......... .......... .......... ..........  0% 63.6M 2s
   250K .......... .......... .......... .......... ..........  0% 64.0M 2s
   300K .......... .......... .......... .......... ..........  0% 82.3M 2s
   350K .......... .......... .......... .......... ..........  0% 80.4M 2s
   400K .......... .......... .......... .......... ..........  0% 92.4M 1s
   450K .......... .......... .......... .......... ..........  0% 96.0M 1s
   500K .......... .......... .......... .......... ..........  0%  139M 1s
   550K ..

Downloaded files for lessac
voices/libritts


200 OK
Length: 136673811 (130M) [application/octet-stream]
Saving to: ‘voices/libritts/libritts_model.onnx’

     0K .......... .......... .......... .......... ..........  0% 18.2M 7s
    50K .......... .......... .......... .......... ..........  0% 19.1M 7s
   100K .......... .......... .......... .......... ..........  0% 93.1M 5s
   150K .......... .......... .......... .......... ..........  0% 42.9M 5s
   200K .......... .......... .......... .......... ..........  0% 40.3M 4s
   250K .......... .......... .......... .......... ..........  0%  112M 4s
   300K .......... .......... .......... .......... ..........  0% 78.9M 3s
   350K .......... .......... .......... .......... ..........  0% 83.1M 3s
   400K .......... .......... .......... .......... ..........  0% 92.4M 3s
   450K .......... .......... .......... .......... ..........  0%  102M 3s
   500K .......... .......... .......... .......... ..........  0%  107M 3s
   550K .......... .......... .......... .......... ...

Downloaded files for libritts
voices/libritts_r


200 OK
Length: 78580914 (75M) [application/octet-stream]
Saving to: ‘voices/libritts_r/libritts_r_model.onnx’

     0K .......... .......... .......... .......... ..........  0% 23.2M 3s
    50K .......... .......... .......... .......... ..........  0% 17.6M 4s
   100K .......... .......... .......... .......... ..........  0% 19.0M 4s
   150K .......... .......... .......... .......... ..........  0% 72.9M 3s
   200K .......... .......... .......... .......... ..........  0% 28.0M 3s
   250K .......... .......... .......... .......... ..........  0% 78.5M 3s
   300K .......... .......... .......... .......... ..........  0% 70.7M 2s
   350K .......... .......... .......... .......... ..........  0% 65.9M 2s
   400K .......... .......... .......... .......... ..........  0%  109M 2s
   450K .......... .......... .......... .......... ..........  0% 89.0M 2s
   500K .......... .......... .......... .......... ..........  0% 85.7M 2s
   550K .......... .......... .......... .......... .

Downloaded files for libritts_r
voices/ljspeech


302 Found
Location: https://cdn-lfs.hf.co/repos/ed/06/ed062eb100d7bd80d78f61252cd190fca48cbda97eb1753fb827ff3339a6b11c/6f52a751e2349abe7a76735eb09dc1875298c77ea2342ffd2fef79ff81b87f22?response-content-disposition=attachment%3B+filename*%3DUTF-8%27%27en_US-ljspeech-medium.onnx%3B+filename%3D%22en_US-ljspeech-medium.onnx%22%3B&Expires=1729365830&Policy=eyJTdGF0ZW1lbnQiOlt7IkNvbmRpdGlvbiI6eyJEYXRlTGVzc1RoYW4iOnsiQVdTOkVwb2NoVGltZSI6MTcyOTM2NTgzMH19LCJSZXNvdXJjZSI6Imh0dHBzOi8vY2RuLWxmcy5oZi5jby9yZXBvcy9lZC8wNi9lZDA2MmViMTAwZDdiZDgwZDc4ZjYxMjUyY2QxOTBmY2E0OGNiZGE5N2ViMTc1M2ZiODI3ZmYzMzM5YTZiMTFjLzZmNTJhNzUxZTIzNDlhYmU3YTc2NzM1ZWIwOWRjMTg3NTI5OGM3N2VhMjM0MmZmZDJmZWY3OWZmODFiODdmMjI%7EcmVzcG9uc2UtY29udGVudC1kaXNwb3NpdGlvbj0qIn1dfQ__&Signature=ZRE0AY0XJ8WiQrYnaHH5vs0txZ8FR6AFzWZZe5ID4dU-1nJBvhFgqSRDvHhm7XGP5napv6nU--M%7ECu61KKIXA6B0htVnOXQHcsHX1l%7EzNthFFppvFBoZGY0cdwPc13qXrHGpxUAfjoZIqfr2QPnYSfjGSFQuUMkU2i2GafcoHakBJpG6JYIKdqKK1pQoTsTi%7EnTgtFsC4T8KNdC-BdNzi5VVKmuIq0Kqpo42v6umI6B1qURQkJg19czV

Downloaded files for ljspeech
voices/norman


200 OK
Length: 63531379 (61M) [application/octet-stream]
Saving to: ‘voices/norman/norman_model.onnx’

     0K .......... .......... .......... .......... ..........  0% 13.0M 5s
    50K .......... .......... .......... .......... ..........  0% 18.2M 4s
   100K .......... .......... .......... .......... ..........  0% 40.9M 3s
   150K .......... .......... .......... .......... ..........  0% 63.9M 3s
   200K .......... .......... .......... .......... ..........  0% 39.6M 2s
   250K .......... .......... .......... .......... ..........  0% 70.2M 2s
   300K .......... .......... .......... .......... ..........  0% 71.2M 2s
   350K .......... .......... .......... .......... ..........  0% 47.4M 2s
   400K .......... .......... .......... .......... ..........  0% 46.1M 2s
   450K .......... .......... .......... .......... ..........  0% 55.5M 2s
   500K .......... .......... .......... .......... ..........  0% 66.7M 2s
   550K .......... .......... .......... .......... .........

Downloaded files for norman
voices/ryan


200 OK
Length: 63201294 (60M) [application/octet-stream]
Saving to: ‘voices/ryan/ryan_model.onnx’

     0K .......... .......... .......... .......... ..........  0% 18.7M 3s
    50K .......... .......... .......... .......... ..........  0% 29.7M 3s
   100K .......... .......... .......... .......... ..........  0% 1.08M 20s
   150K .......... .......... .......... .......... ..........  0% 96.1M 15s
   200K .......... .......... .......... .......... ..........  0% 15.1M 13s
   250K .......... .......... .......... .......... ..........  0% 87.8M 11s
   300K .......... .......... .......... .......... ..........  0% 72.5M 10s
   350K .......... .......... .......... .......... ..........  0% 85.9M 8s
   400K .......... .......... .......... .......... ..........  0% 82.9M 8s
   450K .......... .......... .......... .......... ..........  0% 95.5M 7s
   500K .......... .......... .......... .......... ..........  0% 61.7M 6s
   550K .......... .......... .......... .......... ........

Downloaded files for ryan


... .......... 94%  374K 0s
 58600K .......... .......... .......... .......... .......... 95% 59.1M 0s
 58650K .......... .......... .......... .......... .......... 95% 94.2M 0s
 58700K .......... .......... .......... .......... .......... 95% 28.1M 0s
 58750K .......... .......... .......... .......... .......... 95% 86.1M 0s
 58800K .......... .......... .......... .......... .......... 95% 87.0M 0s
 58850K .......... .......... .......... .......... .......... 95% 83.8M 0s
 58900K .......... .......... .......... .......... .......... 95% 31.3M 0s
 58950K .......... .......... .......... .......... .......... 95%  105M 0s
 59000K .......... .......... .......... .......... .......... 95%  105M 0s
 59050K .......... .......... .......... .......... .......... 95% 78.0M 0s
 59100K .......... .......... .......... .......... .......... 95% 47.6M 0s
 59150K .......... .......... .......... .......... .......... 95% 87.3M 0s
 59200K .......... .......... .......... .......... ........

In [13]:
for voice, urls in voices.items():

    voice_dir = os.path.join('voices', voice)
    print(voice_dir)

    # Download model file
    model_url = urls['model']
    model_filename = os.path.join(voice_dir, f'{voice}_model.onnx')
    
    # Download config file
    config_url = urls['config']
    config_filename = os.path.join(voice_dir, f'{voice}_config.json')

    print(model_filename)
    print(voice)

    piper_cmd = ['piper', '--model', model_filename, '--config', config_filename, '--output_file', f'speech_digits/0/{voice}.wav']
    subprocess.run(['echo', '0'], stdout=subprocess.PIPE, check=True, text=True, input='0\n')
    subprocess.run(piper_cmd, check=True, input='0\n', text=True)




voices/amy
voices/amy/amy_model.onnx
amy
voices/arctic
voices/arctic/arctic_model.onnx
arctic
voices/bryce
voices/bryce/bryce_model.onnx
bryce
voices/danny
voices/danny/danny_model.onnx
danny
voices/hfc_female
voices/hfc_female/hfc_female_model.onnx
hfc_female
voices/hfc_male
voices/hfc_male/hfc_male_model.onnx
hfc_male
voices/joe
voices/joe/joe_model.onnx
joe
voices/john
voices/john/john_model.onnx
john
voices/kathleen
voices/kathleen/kathleen_model.onnx
kathleen
voices/kristin
voices/kristin/kristin_model.onnx
kristin
voices/kusal
voices/kusal/kusal_model.onnx
kusal
voices/l2arctic
voices/l2arctic/l2arctic_model.onnx
l2arctic
voices/lessac
voices/lessac/lessac_model.onnx
lessac
voices/libritts
voices/libritts/libritts_model.onnx
libritts
voices/libritts_r
voices/libritts_r/libritts_r_model.onnx
libritts_r
voices/ljspeech
voices/ljspeech/ljspeech_model.onnx
ljspeech
voices/norman
voices/norman/norman_model.onnx
norman
voices/ryan
voices/ryan/ryan_model.onnx
ryan


In [None]:
# let's listen to all of the 0s

