cognitive-services-speech-s.../common/speech_synthesis_output_for...

135 строки
5.7 KiB
Go

// Copyright (c) Microsoft. All rights reserved.
// Licensed under the MIT license. See LICENSE.md file in the project root for full license information.
package common
// SpeechSynthesisOutputFormat defines the possible speech synthesis output audio formats.
type SpeechSynthesisOutputFormat int
const (
// Raw8Khz8BitMonoMULaw stands for raw-8khz-8bit-mono-mulaw
Raw8Khz8BitMonoMULaw SpeechSynthesisOutputFormat = 1
// Riff16Khz16KbpsMonoSiren stands for riff-16khz-16kbps-mono-siren
// Unsupported by the service. Do not use this value.
Riff16Khz16KbpsMonoSiren SpeechSynthesisOutputFormat = 2
// Audio16Khz16KbpsMonoSiren stands for audio-16khz-16kbps-mono-siren
// Unsupported by the service. Do not use this value.
Audio16Khz16KbpsMonoSiren SpeechSynthesisOutputFormat = 3
// Audio16Khz32KBitRateMonoMp3 stands for audio-16khz-32kbitrate-mono-mp3
Audio16Khz32KBitRateMonoMp3 SpeechSynthesisOutputFormat = 4
// Audio16Khz128KBitRateMonoMp3 stands for audio-16khz-128kbitrate-mono-mp3
Audio16Khz128KBitRateMonoMp3 SpeechSynthesisOutputFormat = 5
// Audio16Khz64KBitRateMonoMp3 stands for audio-16khz-64kbitrate-mono-mp3
Audio16Khz64KBitRateMonoMp3 SpeechSynthesisOutputFormat = 6
// Audio24Khz48KBitRateMonoMp3 stands for audio-24khz-48kbitrate-mono-mp3
Audio24Khz48KBitRateMonoMp3 SpeechSynthesisOutputFormat = 7
// Audio24Khz96KBitRateMonoMp3 stands for audio-24khz-96kbitrate-mono-mp3
Audio24Khz96KBitRateMonoMp3 SpeechSynthesisOutputFormat = 8
// Audio24Khz160KBitRateMonoMp3 stands for audio-24khz-160kbitrate-mono-mp3
Audio24Khz160KBitRateMonoMp3 SpeechSynthesisOutputFormat = 9
// Raw16Khz16BitMonoTrueSilk stands for raw-16khz-16bit-mono-truesilk
Raw16Khz16BitMonoTrueSilk SpeechSynthesisOutputFormat = 10
// Riff16Khz16BitMonoPcm stands for riff-16khz-16bit-mono-pcm
Riff16Khz16BitMonoPcm SpeechSynthesisOutputFormat = 11
// Riff8Khz16BitMonoPcm stands for riff-8khz-16bit-mono-pcm
Riff8Khz16BitMonoPcm SpeechSynthesisOutputFormat = 12
// Riff24Khz16BitMonoPcm stands for riff-24khz-16bit-mono-pcm
Riff24Khz16BitMonoPcm SpeechSynthesisOutputFormat = 13
// Riff8Khz8BitMonoMULaw stands for riff-8khz-8bit-mono-mulaw
Riff8Khz8BitMonoMULaw SpeechSynthesisOutputFormat = 14
// Raw16Khz16BitMonoPcm stands for raw-16khz-16bit-mono-pcm
Raw16Khz16BitMonoPcm SpeechSynthesisOutputFormat = 15
// Raw24Khz16BitMonoPcm stands for raw-24khz-16bit-mono-pcm
Raw24Khz16BitMonoPcm SpeechSynthesisOutputFormat = 16
// Raw8Khz16BitMonoPcm stands for raw-8khz-16bit-mono-pcm
Raw8Khz16BitMonoPcm SpeechSynthesisOutputFormat = 17
// Ogg16Khz16BitMonoOpus stands for ogg-16khz-16bit-mono-opus
Ogg16Khz16BitMonoOpus SpeechSynthesisOutputFormat = 18
// Ogg24Khz16BitMonoOpus stands for ogg-24khz-16bit-mono-opus
Ogg24Khz16BitMonoOpus SpeechSynthesisOutputFormat = 19
// Raw48Khz16BitMonoPcm stands for raw-48khz-16bit-mono-pcm
Raw48Khz16BitMonoPcm SpeechSynthesisOutputFormat = 20
// Riff48Khz16BitMonoPcm stands for riff-48khz-16bit-mono-pcm
Riff48Khz16BitMonoPcm SpeechSynthesisOutputFormat = 21
// Audio48Khz96KBitRateMonoMp3 stands for audio-48khz-96kbitrate-mono-mp3
Audio48Khz96KBitRateMonoMp3 SpeechSynthesisOutputFormat = 22
// Audio48Khz192KBitRateMonoMp3 stands for audio-48khz-192kbitrate-mono-mp3
Audio48Khz192KBitRateMonoMp3 SpeechSynthesisOutputFormat = 23
// Ogg48Khz16BitMonoOpus stands for ogg-48khz-16bit-mono-opus
Ogg48Khz16BitMonoOpus SpeechSynthesisOutputFormat = 24
// Webm16Khz16BitMonoOpus stands for webm-16khz-16bit-mono-opus
Webm16Khz16BitMonoOpus SpeechSynthesisOutputFormat = 25
// Webm24Khz16BitMonoOpus stands for webm-24khz-16bit-mono-opus
Webm24Khz16BitMonoOpus SpeechSynthesisOutputFormat = 26
// Raw24Khz16BitMonoTrueSilk stands for raw-24khz-16bit-mono-truesilk
Raw24Khz16BitMonoTrueSilk SpeechSynthesisOutputFormat = 27
// Raw8Khz8BitMonoALaw stands for raw-8khz-8bit-mono-alaw
Raw8Khz8BitMonoALaw SpeechSynthesisOutputFormat = 28
// Riff8Khz8BitMonoALaw stands for riff-8khz-8bit-mono-alaw
Riff8Khz8BitMonoALaw SpeechSynthesisOutputFormat = 29
// Webm24Khz16Bit24KbpsMonoOpus stands for webm-24khz-16bit-24kbps-mono-opus
// Audio compressed by OPUS codec in a WebM container, with bitrate of 24kbps, optimized for IoT scenario.
Webm24Khz16Bit24KbpsMonoOpus SpeechSynthesisOutputFormat = 30
// Audio16Khz16Bit32KbpsMonoOpus stands for audio-16khz-16bit-32kbps-mono-opus
// Audio compressed by OPUS codec without container, with bitrate of 32kbps.
Audio16Khz16Bit32KbpsMonoOpus SpeechSynthesisOutputFormat = 31
// Audio24Khz16Bit48KbpsMonoOpus stands for audio-24khz-16bit-48kbps-mono-opus
// Audio compressed by OPUS codec without container, with bitrate of 48kbps.
Audio24Khz16Bit48KbpsMonoOpus SpeechSynthesisOutputFormat = 32
// Audio24Khz16Bit24KbpsMonoOpus stands for audio-24khz-16bit-24kbps-mono-opus
// Audio compressed by OPUS codec without container, with bitrate of 24kbps.
Audio24Khz16Bit24KbpsMonoOpus SpeechSynthesisOutputFormat = 33
// Raw22050Hz16BitMonoPcm stands for raw-22050hz-16bit-mono-pcm
// Raw PCM audio at 22050Hz sampling rate and 16-bit depth.
Raw22050Hz16BitMonoPcm SpeechSynthesisOutputFormat = 34
// Riff22050Hz16BitMonoPcm stands for riff-22050hz-16bit-mono-pcm
// PCM audio at 22050Hz sampling rate and 16-bit depth, with RIFF header.
Riff22050Hz16BitMonoPcm SpeechSynthesisOutputFormat = 35
// Raw44100Hz16BitMonoPcm stands for raw-44100hz-16bit-mono-pcm
// Raw PCM audio at 44100Hz sampling rate and 16-bit depth.
Raw44100Hz16BitMonoPcm SpeechSynthesisOutputFormat = 36
// Riff44100Hz16BitMonoPcm stands for riff-44100hz-16bit-mono-pcm
// PCM audio at 44100Hz sampling rate and 16-bit depth, with RIFF header.
Riff44100Hz16BitMonoPcm SpeechSynthesisOutputFormat = 37
// AmrWb16000Hz stands for amr-wb-16000hz
// AMR-WB audio at 16kHz sampling rate.
AmrWb16000Hz SpeechSynthesisOutputFormat = 38
)