msedge-tts
Advanced tools
Comparing version 1.2.2 to 1.3.2
@@ -125,2 +125,5 @@ "use strict"; | ||
this._log("disconnected after:", (Date.now() - this._startTime) / 1000, "seconds"); | ||
for (const requestId in this._queue) { | ||
this._queue[requestId].push(null); | ||
} | ||
}); | ||
@@ -243,3 +246,3 @@ this._ws.on("error", function (error) { | ||
_rawSSMLRequestToFile(path, requestSSML) { | ||
return new Promise((resolve) => __awaiter(this, void 0, void 0, function* () { | ||
return new Promise((resolve, reject) => __awaiter(this, void 0, void 0, function* () { | ||
const stream = this._rawSSMLRequest(requestSSML); | ||
@@ -249,2 +252,5 @@ const chunks = []; | ||
stream.once("close", () => __awaiter(this, void 0, void 0, function* () { | ||
if (Object.keys(this._queue).length > 0 && chunks.length === 0) { | ||
reject("No audio data received"); | ||
} | ||
const output = fs.createWriteStream(path); | ||
@@ -251,0 +257,0 @@ while (chunks.length > 0) { |
/** | ||
* https://docs.microsoft.com/en-us/azure/cognitive-services/speech-service/rest-text-to-speech#audio-outputs | ||
* Only a few of the [possible formats](https://docs.microsoft.com/en-us/azure/cognitive-services/speech-service/rest-text-to-speech#audio-outputs) are accepted. | ||
*/ | ||
export declare enum OUTPUT_FORMAT { | ||
RAW_16KHZ_16BIT_MONO_PCM = "raw-16khz-16bit-mono-pcm", | ||
RAW_24KHZ_16BIT_MONO_PCM = "raw-24khz-16bit-mono-pcm", | ||
RAW_48KHZ_16BIT_MONO_PCM = "raw-48khz-16bit-mono-pcm", | ||
RAW_8KHZ_8BIT_MONO_MULAW = "raw-8khz-8bit-mono-mulaw", | ||
RAW_8KHZ_8BIT_MONO_ALAW = "raw-8khz-8bit-mono-alaw", | ||
RAW_16KHZ_16BIT_MONO_TRUESILK = "raw-16khz-16bit-mono-truesilk", | ||
RAW_24KHZ_16BIT_MONO_TRUESILK = "raw-24khz-16bit-mono-truesilk", | ||
RIFF_16KHZ_16BIT_MONO_PCM = "riff-16khz-16bit-mono-pcm", | ||
RIFF_24KHZ_16BIT_MONO_PCM = "riff-24khz-16bit-mono-pcm", | ||
RIFF_48KHZ_16BIT_MONO_PCM = "riff-48khz-16bit-mono-pcm", | ||
RIFF_8KHZ_8BIT_MONO_MULAW = "riff-8khz-8bit-mono-mulaw", | ||
RIFF_8KHZ_8BIT_MONO_ALAW = "riff-8khz-8bit-mono-alaw", | ||
AUDIO_16KHZ_32KBITRATE_MONO_MP3 = "audio-16khz-32kbitrate-mono-mp3", | ||
AUDIO_16KHZ_64KBITRATE_MONO_MP3 = "audio-16khz-64kbitrate-mono-mp3", | ||
AUDIO_16KHZ_128KBITRATE_MONO_MP3 = "audio-16khz-128kbitrate-mono-mp3", | ||
AUDIO_24KHZ_48KBITRATE_MONO_MP3 = "audio-24khz-48kbitrate-mono-mp3", | ||
AUDIO_24KHZ_96KBITRATE_MONO_MP3 = "audio-24khz-96kbitrate-mono-mp3", | ||
AUDIO_24KHZ_160KBITRATE_MONO_MP3 = "audio-24khz-160kbitrate-mono-mp3", | ||
AUDIO_48KHZ_96KBITRATE_MONO_MP3 = "audio-48khz-96kbitrate-mono-mp3", | ||
AUDIO_48KHZ_192KBITRATE_MONO_MP3 = "audio-48khz-192kbitrate-mono-mp3", | ||
WEBM_16KHZ_16BIT_MONO_OPUS = "webm-16khz-16bit-mono-opus", | ||
WEBM_24KHZ_16BIT_MONO_OPUS = "webm-24khz-16bit-mono-opus", | ||
OGG_16KHZ_16BIT_MONO_OPUS = "ogg-16khz-16bit-mono-opus", | ||
OGG_24KHZ_16BIT_MONO_OPUS = "ogg-24khz-16bit-mono-opus", | ||
OGG_48KHZ_16BIT_MONO_OPUS = "ogg-48khz-16bit-mono-opus" | ||
WEBM_24KHZ_16BIT_MONO_OPUS = "webm-24khz-16bit-mono-opus" | ||
} |
@@ -5,31 +5,43 @@ "use strict"; | ||
/** | ||
* https://docs.microsoft.com/en-us/azure/cognitive-services/speech-service/rest-text-to-speech#audio-outputs | ||
* Only a few of the [possible formats](https://docs.microsoft.com/en-us/azure/cognitive-services/speech-service/rest-text-to-speech#audio-outputs) are accepted. | ||
*/ | ||
var OUTPUT_FORMAT; | ||
(function (OUTPUT_FORMAT) { | ||
OUTPUT_FORMAT["RAW_16KHZ_16BIT_MONO_PCM"] = "raw-16khz-16bit-mono-pcm"; | ||
OUTPUT_FORMAT["RAW_24KHZ_16BIT_MONO_PCM"] = "raw-24khz-16bit-mono-pcm"; | ||
OUTPUT_FORMAT["RAW_48KHZ_16BIT_MONO_PCM"] = "raw-48khz-16bit-mono-pcm"; | ||
OUTPUT_FORMAT["RAW_8KHZ_8BIT_MONO_MULAW"] = "raw-8khz-8bit-mono-mulaw"; | ||
OUTPUT_FORMAT["RAW_8KHZ_8BIT_MONO_ALAW"] = "raw-8khz-8bit-mono-alaw"; | ||
OUTPUT_FORMAT["RAW_16KHZ_16BIT_MONO_TRUESILK"] = "raw-16khz-16bit-mono-truesilk"; | ||
OUTPUT_FORMAT["RAW_24KHZ_16BIT_MONO_TRUESILK"] = "raw-24khz-16bit-mono-truesilk"; | ||
OUTPUT_FORMAT["RIFF_16KHZ_16BIT_MONO_PCM"] = "riff-16khz-16bit-mono-pcm"; | ||
OUTPUT_FORMAT["RIFF_24KHZ_16BIT_MONO_PCM"] = "riff-24khz-16bit-mono-pcm"; | ||
OUTPUT_FORMAT["RIFF_48KHZ_16BIT_MONO_PCM"] = "riff-48khz-16bit-mono-pcm"; | ||
OUTPUT_FORMAT["RIFF_8KHZ_8BIT_MONO_MULAW"] = "riff-8khz-8bit-mono-mulaw"; | ||
OUTPUT_FORMAT["RIFF_8KHZ_8BIT_MONO_ALAW"] = "riff-8khz-8bit-mono-alaw"; | ||
OUTPUT_FORMAT["AUDIO_16KHZ_32KBITRATE_MONO_MP3"] = "audio-16khz-32kbitrate-mono-mp3"; | ||
OUTPUT_FORMAT["AUDIO_16KHZ_64KBITRATE_MONO_MP3"] = "audio-16khz-64kbitrate-mono-mp3"; | ||
OUTPUT_FORMAT["AUDIO_16KHZ_128KBITRATE_MONO_MP3"] = "audio-16khz-128kbitrate-mono-mp3"; | ||
// Streaming ============================= | ||
// AMR_WB_16000HZ = "amr-wb-16000hz", | ||
// AUDIO_16KHZ_16BIT_32KBPS_MONO_OPUS = "audio-16khz-16bit-32kbps-mono-opus", | ||
// AUDIO_16KHZ_32KBITRATE_MONO_MP3 = "audio-16khz-32kbitrate-mono-mp3", | ||
// AUDIO_16KHZ_64KBITRATE_MONO_MP3 = "audio-16khz-64kbitrate-mono-mp3", | ||
// AUDIO_16KHZ_128KBITRATE_MONO_MP3 = "audio-16khz-128kbitrate-mono-mp3", | ||
// AUDIO_24KHZ_16BIT_24KBPS_MONO_OPUS = "audio-24khz-16bit-24kbps-mono-opus", | ||
// AUDIO_24KHZ_16BIT_48KBPS_MONO_OPUS = "audio-24khz-16bit-48kbps-mono-opus", | ||
OUTPUT_FORMAT["AUDIO_24KHZ_48KBITRATE_MONO_MP3"] = "audio-24khz-48kbitrate-mono-mp3"; | ||
OUTPUT_FORMAT["AUDIO_24KHZ_96KBITRATE_MONO_MP3"] = "audio-24khz-96kbitrate-mono-mp3"; | ||
OUTPUT_FORMAT["AUDIO_24KHZ_160KBITRATE_MONO_MP3"] = "audio-24khz-160kbitrate-mono-mp3"; | ||
OUTPUT_FORMAT["AUDIO_48KHZ_96KBITRATE_MONO_MP3"] = "audio-48khz-96kbitrate-mono-mp3"; | ||
OUTPUT_FORMAT["AUDIO_48KHZ_192KBITRATE_MONO_MP3"] = "audio-48khz-192kbitrate-mono-mp3"; | ||
OUTPUT_FORMAT["WEBM_16KHZ_16BIT_MONO_OPUS"] = "webm-16khz-16bit-mono-opus"; | ||
// AUDIO_24KHZ_160KBITRATE_MONO_MP3 = "audio-24khz-160kbitrate-mono-mp3", | ||
// AUDIO_48KHZ_96KBITRATE_MONO_MP3 = "audio-48khz-96kbitrate-mono-mp3", | ||
// AUDIO_48KHZ_192KBITRATE_MONO_MP3 = "audio-48khz-192kbitrate-mono-mp3", | ||
// OGG_16KHZ_16BIT_MONO_OPUS = "ogg-16khz-16bit-mono-opus", | ||
// OGG_24KHZ_16BIT_MONO_OPUS = "ogg-24khz-16bit-mono-opus", | ||
// OGG_48KHZ_16BIT_MONO_OPUS = "ogg-48khz-16bit-mono-opus", | ||
// RAW_8KHZ_8BIT_MONO_ALAW = "raw-8khz-8bit-mono-alaw", | ||
// RAW_8KHZ_8BIT_MONO_MULAW = "raw-8khz-8bit-mono-mulaw", | ||
// RAW_8KHZ_16BIT_MONO_PCM = "raw-8khz-16bit-mono-pcm", | ||
// RAW_16KHZ_16BIT_MONO_PCM = "raw-16khz-16bit-mono-pcm", | ||
// RAW_16KHZ_16BIT_MONO_TRUESILK = "raw-16khz-16bit-mono-truesilk", | ||
// RAW_22050HZ_16BIT_MONO_PCM = "raw-22050hz-16bit-mono-pcm", | ||
// RAW_24KHZ_16BIT_MONO_PCM = "raw-24khz-16bit-mono-pcm", | ||
// RAW_24KHZ_16BIT_MONO_TRUESILK = "raw-24khz-16bit-mono-truesilk", | ||
// RAW_44100HZ_16BIT_MONO_PCM = "raw-44100hz-16bit-mono-pcm", | ||
// RAW_48KHZ_16BIT_MONO_PCM = "raw-48khz-16bit-mono-pcm", | ||
// WEBM_16KHZ_16BIT_MONO_OPUS = "webm-16khz-16bit-mono-opus", | ||
// WEBM_24KHZ_16BIT_24KBPS_MONO_OPUS = "webm-24khz-16bit-24kbps-mono-opus", | ||
OUTPUT_FORMAT["WEBM_24KHZ_16BIT_MONO_OPUS"] = "webm-24khz-16bit-mono-opus"; | ||
OUTPUT_FORMAT["OGG_16KHZ_16BIT_MONO_OPUS"] = "ogg-16khz-16bit-mono-opus"; | ||
OUTPUT_FORMAT["OGG_24KHZ_16BIT_MONO_OPUS"] = "ogg-24khz-16bit-mono-opus"; | ||
OUTPUT_FORMAT["OGG_48KHZ_16BIT_MONO_OPUS"] = "ogg-48khz-16bit-mono-opus"; | ||
// Non-streaming ============================= | ||
// RIFF_8KHZ_8BIT_MONO_ALAW = "riff-8khz-8bit-mono-alaw", | ||
// RIFF_8KHZ_8BIT_MONO_MULAW = "riff-8khz-8bit-mono-mulaw", | ||
// RIFF_8KHZ_16BIT_MONO_PCM = "riff-8khz-16bit-mono-pcm", | ||
// RIFF_22050HZ_16BIT_MONO_PCM = "riff-22050hz-16bit-mono-pcm", | ||
// RIFF_24KHZ_16BIT_MONO_PCM = "riff-24khz-16bit-mono-pcm", | ||
// RIFF_44100HZ_16BIT_MONO_PCM = "riff-44100hz-16bit-mono-pcm", | ||
// RIFF_48KHZ_16BIT_MONO_PCM = "riff-48khz-16bit-mono-pcm", | ||
})(OUTPUT_FORMAT = exports.OUTPUT_FORMAT || (exports.OUTPUT_FORMAT = {})); |
{ | ||
"name": "msedge-tts", | ||
"version": "1.2.2", | ||
"version": "1.3.2", | ||
"description": "An Azure Speech Service module that uses the Microsoft Edge Read Aloud API.", | ||
@@ -5,0 +5,0 @@ "author": "Migushthe2nd <Migushthe2nd@users.noreply.github.com>", |
@@ -6,3 +6,3 @@ # MsEdgeTTS | ||
Full support for SSML, however, the following is the default SSML object: | ||
~~Full support for SSML~~ Only supports `speak`, `voice`, and `prosody` element types. The following is the default SSML object: | ||
@@ -9,0 +9,0 @@ ```xml |
32028
556