// edge-tts.js
// Forked from koodo-reader/koodo-reader.
const { randomBytes } = require("crypto");
const { WebSocket } = require("ws");
/**
 * Lookup table from output-format identifier to the Content-Type string
 * associated with it. Entries are declared grouped by content type and then
 * flattened into `[format, contentType]` pairs, keeping declaration order.
 */
const FORMAT_CONTENT_TYPE = new Map(
  [
    [
      "audio/basic",
      [
        "raw-16khz-16bit-mono-pcm",
        "raw-48khz-16bit-mono-pcm",
        "raw-8khz-8bit-mono-mulaw",
        "raw-8khz-8bit-mono-alaw",
      ],
    ],
    [
      "audio/SILK",
      ["raw-16khz-16bit-mono-truesilk", "raw-24khz-16bit-mono-truesilk"],
    ],
    [
      "audio/x-wav",
      [
        "riff-16khz-16bit-mono-pcm",
        "riff-24khz-16bit-mono-pcm",
        "riff-48khz-16bit-mono-pcm",
        "riff-8khz-8bit-mono-mulaw",
        "riff-8khz-8bit-mono-alaw",
      ],
    ],
    [
      "audio/mpeg",
      [
        "audio-16khz-32kbitrate-mono-mp3",
        "audio-16khz-64kbitrate-mono-mp3",
        "audio-16khz-128kbitrate-mono-mp3",
        "audio-24khz-48kbitrate-mono-mp3",
        "audio-24khz-96kbitrate-mono-mp3",
        "audio-24khz-160kbitrate-mono-mp3",
        "audio-48khz-96kbitrate-mono-mp3",
        "audio-48khz-192kbitrate-mono-mp3",
      ],
    ],
    [
      "audio/webm; codec=opus",
      ["webm-16khz-16bit-mono-opus", "webm-24khz-16bit-mono-opus"],
    ],
    ["audio/ogg; codecs=opus; rate=16000", ["ogg-16khz-16bit-mono-opus"]],
    ["audio/ogg; codecs=opus; rate=24000", ["ogg-24khz-16bit-mono-opus"]],
    ["audio/ogg; codecs=opus; rate=48000", ["ogg-48khz-16bit-mono-opus"]],
  ].flatMap(([contentType, formats]) =>
    formats.map((formatName) => [formatName, contentType])
  )
);
/**
 * WebSocket client for the Edge "read aloud" speech synthesis endpoint.
 *
 * A single socket is reused across requests. Every request is identified by a
 * random request id; the server echoes that id in each frame, which is how
 * incoming audio is routed back to the promise returned by `convert`.
 */
class Service {
  /** Extracts the request id header from a frame's header text. */
  static REQUEST_ID_PATTERN = /X-RequestId:(?<id>[a-z0-9]+)/;
  /** Last header line of a binary audio frame; audio bytes follow it. */
  static AUDIO_SEPARATOR = "Path:audio\r\n";
  /** Close the socket after this long without a new `convert` call. */
  static IDLE_TIMEOUT_MS = 10000;
  /** Give up on a single conversion after this long. */
  static CONVERT_TIMEOUT_MS = 10000;

  /** The socket currently used for new requests, or null when disconnected. */
  ws = null;
  /** requestId -> { resolve, reject, socket } for every in-flight request. */
  executorMap;
  /** requestId -> array of audio chunks (Buffers) received so far. */
  bufferMap;
  /** Handle of the idle-disconnect timer, or null when none is armed. */
  timer = null;

  constructor() {
    this.executorMap = new Map();
    this.bufferMap = new Map();
  }

  /**
   * Opens a new socket to the synthesis endpoint and wires up its handlers.
   *
   * @returns {Promise<WebSocket>} Resolves with the socket once it is open;
   *   rejects with an Error if the connection fails or closes before opening.
   */
  async connect() {
    const connectionId = randomBytes(16).toString("hex").toLowerCase();
    const url = `wss://speech.platform.bing.com/consumer/speech/synthesize/readaloud/edge/v1?TrustedClientToken=6A5AA1D4EAFF4E9FB37E23D68491D6F4&ConnectionId=${connectionId}`;
    const ws = new WebSocket(url, {
      host: "speech.platform.bing.com",
      origin: "chrome-extension://jdiccldimpdaibmpdkjnbmckianbfold",
      headers: {
        "User-Agent":
          "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/103.0.5060.66 Safari/537.36 Edg/103.0.1264.44",
      },
    });
    return new Promise((resolve, reject) => {
      ws.on("open", () => {
        resolve(ws);
      });
      ws.on("close", (code, reason) => {
        // Per the original author's note, the server drops connections that
        // have been idle for more than 30 seconds.
        this.handleClose(ws, code, reason);
        // No-op if the promise already settled; otherwise prevents a caller
        // from waiting forever on a socket that closed before opening.
        reject(new Error(`连接已关闭: ${reason} ${code}`));
      });
      ws.on("message", (message, isBinary) => {
        this.handleMessage(message, isBinary);
      });
      ws.on("error", (error) => {
        console.error(`连接失败: ${error}`);
        reject(new Error(`连接失败: ${error}`, { cause: error }));
      });
      ws.on("ping", (data) => {
        console.debug("ping %s", data);
      });
      ws.on("pong", (data) => {
        console.debug("pong %s", data);
      });
    });
  }

  /**
   * Tears down state belonging to a socket that has closed.
   *
   * Only requests that were sent over `socket` are rejected, so a late close
   * event from an old socket cannot fail requests running on a newer one.
   *
   * @param {object} socket - The socket that closed.
   * @param {number} code - Close code reported by the socket.
   * @param {*} reason - Close reason reported by the socket.
   */
  handleClose(socket, code, reason) {
    const description = `连接已关闭: ${reason} ${code}`;
    if (this.ws === socket) {
      this.ws = null;
      if (this.timer) {
        clearTimeout(this.timer);
        this.timer = null;
      }
    }
    for (const [requestId, executor] of this.executorMap) {
      if (executor.socket !== socket) {
        continue;
      }
      this.executorMap.delete(requestId);
      this.bufferMap.delete(requestId);
      executor.reject(new Error(description));
    }
    console.info(description);
  }

  /**
   * Dispatches one incoming frame to the text or binary handler.
   *
   * @param {Buffer} message - Raw frame payload.
   * @param {boolean} isBinary - Whether the frame is a binary (audio) frame.
   */
  handleMessage(message, isBinary) {
    if (isBinary) {
      this.handleAudioFrame(message);
      return;
    }
    console.debug("收到文本消息:%s", message);
    this.handleTextFrame(message.toString());
  }

  /**
   * Handles `turn.start` / `turn.end` control frames; other text frames are
   * ignored.
   *
   * @param {string} data - Decoded text frame.
   */
  handleTextFrame(data) {
    const isStart = data.includes("Path:turn.start");
    const isEnd = !isStart && data.includes("Path:turn.end");
    if (!isStart && !isEnd) {
      return;
    }
    const requestId = this.extractRequestId(data);
    if (requestId == null) {
      console.warn("无法解析请求 ID,忽略该消息");
      return;
    }
    if (isStart) {
      // Only buffer audio for requests that are still being waited on, so a
      // late start for a timed-out request does not leak a buffer.
      if (this.executorMap.has(requestId)) {
        console.debug(`开始传输:${requestId}……`);
        this.bufferMap.set(requestId, []);
      } else {
        console.debug(`请求已被丢弃:${requestId}`);
      }
      return;
    }
    const executor = this.executorMap.get(requestId);
    const chunks = this.bufferMap.get(requestId) ?? [];
    // Always release both entries; the buffer is no longer needed once the
    // turn has ended, whether or not anyone is still waiting.
    this.executorMap.delete(requestId);
    this.bufferMap.delete(requestId);
    if (executor) {
      executor.resolve(Buffer.concat(chunks));
      console.debug(`传输完成:${requestId}……`);
    } else {
      console.debug(`请求已被丢弃:${requestId}`);
    }
  }

  /**
   * Appends the audio payload of a binary frame to its request's buffer.
   *
   * The header text is read starting at byte 2 (the first two bytes are
   * skipped — presumably a length prefix; confirm against the protocol) up to
   * and including the `Path:audio` line; everything after is audio data.
   *
   * @param {Buffer} data - Raw binary frame.
   */
  handleAudioFrame(data) {
    const separatorIndex = data.indexOf(Service.AUDIO_SEPARATOR);
    if (separatorIndex === -1) {
      console.warn("收到无法识别的二进制消息,已忽略");
      return;
    }
    const contentIndex = separatorIndex + Service.AUDIO_SEPARATOR.length;
    const headers = data.subarray(2, contentIndex).toString();
    const requestId = this.extractRequestId(headers);
    if (requestId == null) {
      console.warn("无法解析请求 ID,忽略该消息");
      return;
    }
    const content = data.subarray(contentIndex);
    console.debug(
      `收到音频片段:${requestId} Length: ${content.length}\n${headers}`
    );
    const chunks = this.bufferMap.get(requestId);
    if (chunks) {
      chunks.push(content);
    } else {
      console.debug(`请求已被丢弃:${requestId}`);
    }
  }

  /**
   * @param {string} text - Header text of a frame.
   * @returns {string|null} The request id found in `text`, or null if absent.
   */
  extractRequestId(text) {
    const match = Service.REQUEST_ID_PATTERN.exec(text);
    return match?.groups?.id ?? null;
  }

  /**
   * Rejects a pending request (if it is still pending) and frees its state.
   *
   * @param {string} requestId - Id of the request to fail.
   * @param {Error} error - Reason passed to the request's `reject`.
   */
  failRequest(requestId, error) {
    const executor = this.executorMap.get(requestId);
    this.executorMap.delete(requestId);
    this.bufferMap.delete(requestId);
    executor?.reject(error);
  }

  /**
   * Synthesizes speech for an SSML document.
   *
   * @param {string} ssml - SSML document to send to the service.
   * @param {string} format - Output format identifier sent as `outputFormat`.
   * @returns {Promise<Buffer>} The concatenated audio data.
   * @throws {Error} If connecting or sending fails, the socket closes while
   *   the request is pending, or no result arrives within the timeout.
   */
  async convert(ssml, format) {
    if (this.ws == null || this.ws.readyState !== WebSocket.OPEN) {
      console.info("准备连接服务器……");
      this.ws = await this.connect();
      console.info("连接成功!");
    }
    // Pin the socket for this request so later reconnects cannot redirect it.
    const socket = this.ws;
    const requestId = randomBytes(16).toString("hex").toLowerCase();
    const result = new Promise((resolve, reject) => {
      // Settled by the message/close handlers once the server responds.
      this.executorMap.set(requestId, { resolve, reject, socket });
      // Send the configuration message first.
      const configData = {
        context: {
          synthesis: {
            audio: {
              metadataoptions: {
                sentenceBoundaryEnabled: "false",
                wordBoundaryEnabled: "false",
              },
              outputFormat: format,
            },
          },
        },
      };
      const configMessage =
        `X-Timestamp:${Date()}\r\n` +
        "Content-Type:application/json; charset=utf-8\r\n" +
        "Path:speech.config\r\n\r\n" +
        JSON.stringify(configData);
      console.info(`开始转换:${requestId}……`);
      console.debug(`准备发送配置请求:${requestId}\n`, configMessage);
      socket.send(configMessage, (configError) => {
        if (configError) {
          console.error(`配置请求发送失败:${requestId}\n`, configError);
          // Fail fast instead of waiting for the conversion timeout.
          this.failRequest(
            requestId,
            new Error(`配置请求发送失败:${requestId}`, { cause: configError })
          );
          return;
        }
        // Then send the SSML message.
        const ssmlMessage =
          `X-Timestamp:${Date()}\r\n` +
          `X-RequestId:${requestId}\r\n` +
          `Content-Type:application/ssml+xml\r\n` +
          `Path:ssml\r\n\r\n` +
          ssml;
        console.debug(`准备发送SSML消息:${requestId}\n`, ssmlMessage);
        socket.send(ssmlMessage, (ssmlError) => {
          if (ssmlError) {
            console.error(`SSML消息发送失败:${requestId}\n`, ssmlError);
            this.failRequest(
              requestId,
              new Error(`SSML消息发送失败:${requestId}`, { cause: ssmlError })
            );
          }
        });
      });
    });
    // A new request arrived: restart the idle-disconnect timer.
    if (this.timer) {
      console.debug("收到新的请求,清除超时定时器");
      clearTimeout(this.timer);
    }
    // Proactively close the connection after 10 seconds without a request.
    console.debug("创建新的超时定时器");
    this.timer = setTimeout(() => {
      this.timer = null;
      if (this.ws && this.ws.readyState === WebSocket.OPEN) {
        console.debug("已经 10 秒没有请求,主动关闭连接");
        this.ws.close(1000);
      }
    }, Service.IDLE_TIMEOUT_MS);
    let timeoutHandle;
    const timeout = new Promise((_resolve, reject) => {
      // If no result arrives within 10 seconds, drop the request and fail.
      timeoutHandle = setTimeout(() => {
        this.executorMap.delete(requestId);
        this.bufferMap.delete(requestId);
        reject(new Error("转换超时"));
      }, Service.CONVERT_TIMEOUT_MS);
    });
    let data;
    try {
      data = await Promise.race([result, timeout]);
    } finally {
      // Do not leave the timeout pending once the request has settled.
      clearTimeout(timeoutHandle);
    }
    console.info(`转换完成:${requestId}`);
    console.info(`剩余 ${this.executorMap.size} 个任务`);
    return data;
  }
}
// Module-level Service instance; `ra` sends every conversion through it.
const service = new Service();
/**
 * Calls `fn` until it succeeds or `times` attempts have failed.
 *
 * @param {() => Promise<*>} fn - Operation to attempt.
 * @param {number} times - Maximum number of attempts.
 * @param {(index: number, error: *) => void} [errorFn] - Called after each
 *   failed attempt with the zero-based attempt index and the caught error.
 * @param {string} [failedMessage] - Message for the final error; a default
 *   message is used when null or undefined.
 * @returns {Promise<*>} The value of the first successful attempt.
 * @throws {AggregateError} When every attempt failed. `message` is
 *   `failedMessage` (or the default) and `errors` lists each attempt's error
 *   in order.
 */
const retry = async function (fn, times, errorFn, failedMessage) {
  const errors = [];
  for (let attempt = 0; attempt < times; attempt++) {
    try {
      return await fn();
    } catch (error) {
      if (errorFn) {
        errorFn(attempt, error);
      }
      errors.push(error);
    }
  }
  // A real Error (with a stack trace) instead of a plain object; it keeps the
  // same `message` and `errors` properties.
  throw new AggregateError(errors, failedMessage ?? "多次尝试后失败");
};
/**
 * Converts an SSML document to audio using the shared `service`, retrying up
 * to three times.
 *
 * Failures are logged rather than thrown, so callers must check the result.
 *
 * @param {string} text - SSML document to synthesize.
 * @returns {Promise<*>} Whatever `service.convert` resolves with, or
 *   `undefined` if the input is invalid or every attempt failed.
 */
const ra = async (text) => {
  console.debug(`请求正文:${text}`);
  try {
    const format = "webm-24khz-16bit-mono-opus";
    if (!FORMAT_CONTENT_TYPE.has(format)) {
      throw new Error(`无效的音频格式:${format}`);
    }
    if (text == null) {
      throw new Error(`转换参数无效`);
    }
    return await retry(
      () => service.convert(text, format),
      3,
      (index, error) => {
        // `index` is zero-based; report attempts starting from 1.
        console.warn(`第${index + 1}次转换失败:${error}`);
      },
      "服务器多次尝试后转换失败"
    );
  } catch (error) {
    // Handles Error objects as well as bare strings or other thrown values.
    console.error(`发生错误, ${error?.message ?? error}`);
    return undefined;
  }
};
// ra(
// `<speak xmlns="http://www.w3.org/2001/10/synthesis" xmlns:mstts="http://www.w3.org/2001/mstts" xmlns:emo="http://www.w3.org/2009/10/emotionml" version="1.0" xml:lang="en-US"> <voice name="zh-CN-XiaoxiaoNeural"><prosody rate="0%" pitch="0%">如果喜欢这个项目的话请点个 Star 吧。</prosody ></voice > </speak >`
// );
// `ra` is the only name exported from this module.
module.exports = { ra };