/
asr_tts.json
53 lines (53 loc) · 1.41 KB
/
asr_tts.json
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
{
"chainer": {
"in": "speech_in_encoded",
"pipe": [
{
"class_name": "base64_decode_bytesIO",
"in": ["speech_in_encoded"],
"out": ["speech_in"]
},
{
"class_name": "nemo_asr",
"nemo_params_path": "{NEMO_PATH}/quartznet15x5/quartznet15x5.yaml",
"load_path": "{NEMO_PATH}/quartznet15x5",
"in": ["speech_in"],
"out": ["text"]
},
{
"class_name": "nemo_tts",
"nemo_params_path": "{TTS_PATH}/tacotron2_waveglow.yaml",
"load_path": "{TTS_PATH}",
"in": ["text"],
"out": ["speech_out"]
},
{
"class_name": "bytesIO_encode_base64",
"in": ["speech_out"],
"out": ["speech_out_encoded"]
}
],
"out": ["text", "speech_out_encoded"]
},
"metadata": {
"variables": {
"NEMO_PATH": "~/.deeppavlov/models/nemo",
"TTS_PATH": "{NEMO_PATH}/tacotron2_waveglow"
},
"requirements": [
"{DEEPPAVLOV_PATH}/requirements/pytorch.txt",
"{DEEPPAVLOV_PATH}/requirements/nemo-asr.txt",
"{DEEPPAVLOV_PATH}/requirements/nemo-tts.txt"
],
"download": [
{
"url": "http://files.deeppavlov.ai/deeppavlov_data/nemo/quartznet15x5.tar.gz",
"subdir": "{NEMO_PATH}"
},
{
"url": "http://files.deeppavlov.ai/deeppavlov_data/nemo/tacotron2_waveglow.tar.gz",
"subdir": "{NEMO_PATH}"
}
]
}
}