google-cloud-text_to_speech-v1 1.1.1 → 1.2.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/lib/google/cloud/text_to_speech/v1/text_to_speech/client.rb +3 -1
- data/lib/google/cloud/text_to_speech/v1/text_to_speech/rest/client.rb +3 -1
- data/lib/google/cloud/text_to_speech/v1/version.rb +1 -1
- data/lib/google/cloud/texttospeech/v1/cloud_tts_pb.rb +5 -1
- data/proto_docs/google/cloud/texttospeech/v1/cloud_tts.rb +68 -0
- metadata +3 -3
checksums.yaml
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
---
|
2
2
|
SHA256:
|
3
|
-
metadata.gz:
|
4
|
-
data.tar.gz:
|
3
|
+
metadata.gz: fb48791dcea870341c721fee7fe39e36697dd0467219c8d544b58a0a37d4d14e
|
4
|
+
data.tar.gz: 968a0a33b6c1674b4081217033be2233ed32434757ac2c7ecd760ebab54d6aa4
|
5
5
|
SHA512:
|
6
|
-
metadata.gz:
|
7
|
-
data.tar.gz:
|
6
|
+
metadata.gz: 692b8f1eb891d7665b3b2e92e69512eb25befc2afe718a3ca9b59359b2dc805347e66e283457f6fe508bc5266a124cc5a36f5ecbe1820cdf4c5358f1aee93f5d
|
7
|
+
data.tar.gz: 8188dc4151a2c54963a76d86f4e5c0d41d65a57afc1b10a0e26e7832c73d2b18c975a4c274866406de3c3714e4c98382df295a7733beb36a2e41a117000fea24
|
@@ -267,7 +267,7 @@ module Google
|
|
267
267
|
# @param options [::Gapic::CallOptions, ::Hash]
|
268
268
|
# Overrides the default settings for this call, e.g, timeout, retries, etc. Optional.
|
269
269
|
#
|
270
|
-
# @overload synthesize_speech(input: nil, voice: nil, audio_config: nil)
|
270
|
+
# @overload synthesize_speech(input: nil, voice: nil, audio_config: nil, advanced_voice_options: nil)
|
271
271
|
# Pass arguments to `synthesize_speech` via keyword arguments. Note that at
|
272
272
|
# least one keyword argument is required. To specify no parameters, or to keep all
|
273
273
|
# the default parameter values, pass an empty Hash as a request object (see above).
|
@@ -278,6 +278,8 @@ module Google
|
|
278
278
|
# Required. The desired voice of the synthesized audio.
|
279
279
|
# @param audio_config [::Google::Cloud::TextToSpeech::V1::AudioConfig, ::Hash]
|
280
280
|
# Required. The configuration of the synthesized audio.
|
281
|
+
# @param advanced_voice_options [::Google::Cloud::TextToSpeech::V1::AdvancedVoiceOptions, ::Hash]
|
282
|
+
# Advanced voice options.
|
281
283
|
#
|
282
284
|
# @yield [response, operation] Access the result along with the RPC operation
|
283
285
|
# @yieldparam response [::Google::Cloud::TextToSpeech::V1::SynthesizeSpeechResponse]
|
@@ -261,7 +261,7 @@ module Google
|
|
261
261
|
# @param options [::Gapic::CallOptions, ::Hash]
|
262
262
|
# Overrides the default settings for this call, e.g, timeout, retries etc. Optional.
|
263
263
|
#
|
264
|
-
# @overload synthesize_speech(input: nil, voice: nil, audio_config: nil)
|
264
|
+
# @overload synthesize_speech(input: nil, voice: nil, audio_config: nil, advanced_voice_options: nil)
|
265
265
|
# Pass arguments to `synthesize_speech` via keyword arguments. Note that at
|
266
266
|
# least one keyword argument is required. To specify no parameters, or to keep all
|
267
267
|
# the default parameter values, pass an empty Hash as a request object (see above).
|
@@ -272,6 +272,8 @@ module Google
|
|
272
272
|
# Required. The desired voice of the synthesized audio.
|
273
273
|
# @param audio_config [::Google::Cloud::TextToSpeech::V1::AudioConfig, ::Hash]
|
274
274
|
# Required. The configuration of the synthesized audio.
|
275
|
+
# @param advanced_voice_options [::Google::Cloud::TextToSpeech::V1::AdvancedVoiceOptions, ::Hash]
|
276
|
+
# Advanced voice options.
|
275
277
|
# @yield [result, operation] Access the result along with the TransportOperation object
|
276
278
|
# @yieldparam result [::Google::Cloud::TextToSpeech::V1::SynthesizeSpeechResponse]
|
277
279
|
# @yieldparam operation [::Gapic::Rest::TransportOperation]
|
@@ -10,7 +10,7 @@ require 'google/api/field_behavior_pb'
|
|
10
10
|
require 'google/api/resource_pb'
|
11
11
|
|
12
12
|
|
13
|
-
descriptor_data = "\n,google/cloud/texttospeech/v1/cloud_tts.proto\x12\x1cgoogle.cloud.texttospeech.v1\x1a\x1cgoogle/api/annotations.proto\x1a\x17google/api/client.proto\x1a\x1fgoogle/api/field_behavior.proto\x1a\x19google/api/resource.proto\"/\n\x11ListVoicesRequest\x12\x1a\n\rlanguage_code\x18\x01 \x01(\tB\x03\xe0\x41\x01\"I\n\x12ListVoicesResponse\x12\x33\n\x06voices\x18\x01 \x03(\x0b\x32#.google.cloud.texttospeech.v1.Voice\"\x94\x01\n\x05Voice\x12\x16\n\x0elanguage_codes\x18\x01 \x03(\t\x12\x0c\n\x04name\x18\x02 \x01(\t\x12\x42\n\x0bssml_gender\x18\x03 \x01(\x0e\x32-.google.cloud.texttospeech.v1.SsmlVoiceGender\x12!\n\x19natural_sample_rate_hertz\x18\x04 \x01(\x05\"\
|
13
|
+
descriptor_data = "\n,google/cloud/texttospeech/v1/cloud_tts.proto\x12\x1cgoogle.cloud.texttospeech.v1\x1a\x1cgoogle/api/annotations.proto\x1a\x17google/api/client.proto\x1a\x1fgoogle/api/field_behavior.proto\x1a\x19google/api/resource.proto\"/\n\x11ListVoicesRequest\x12\x1a\n\rlanguage_code\x18\x01 \x01(\tB\x03\xe0\x41\x01\"I\n\x12ListVoicesResponse\x12\x33\n\x06voices\x18\x01 \x03(\x0b\x32#.google.cloud.texttospeech.v1.Voice\"\x94\x01\n\x05Voice\x12\x16\n\x0elanguage_codes\x18\x01 \x03(\t\x12\x0c\n\x04name\x18\x02 \x01(\t\x12\x42\n\x0bssml_gender\x18\x03 \x01(\x0e\x32-.google.cloud.texttospeech.v1.SsmlVoiceGender\x12!\n\x19natural_sample_rate_hertz\x18\x04 \x01(\x05\"d\n\x14\x41\x64vancedVoiceOptions\x12*\n\x1dlow_latency_journey_synthesis\x18\x01 \x01(\x08H\x00\x88\x01\x01\x42 \n\x1e_low_latency_journey_synthesis\"\xdd\x02\n\x17SynthesizeSpeechRequest\x12@\n\x05input\x18\x01 \x01(\x0b\x32,.google.cloud.texttospeech.v1.SynthesisInputB\x03\xe0\x41\x02\x12\x46\n\x05voice\x18\x02 \x01(\x0b\x32\x32.google.cloud.texttospeech.v1.VoiceSelectionParamsB\x03\xe0\x41\x02\x12\x44\n\x0c\x61udio_config\x18\x03 \x01(\x0b\x32).google.cloud.texttospeech.v1.AudioConfigB\x03\xe0\x41\x02\x12W\n\x16\x61\x64vanced_voice_options\x18\x08 \x01(\x0b\x32\x32.google.cloud.texttospeech.v1.AdvancedVoiceOptionsH\x00\x88\x01\x01\x42\x19\n\x17_advanced_voice_options\"\xda\x02\n\x19\x43ustomPronunciationParams\x12\x13\n\x06phrase\x18\x01 \x01(\tH\x00\x88\x01\x01\x12h\n\x11phonetic_encoding\x18\x02 \x01(\x0e\x32H.google.cloud.texttospeech.v1.CustomPronunciationParams.PhoneticEncodingH\x01\x88\x01\x01\x12\x1a\n\rpronunciation\x18\x03 \x01(\tH\x02\x88\x01\x01\"o\n\x10PhoneticEncoding\x12!\n\x1dPHONETIC_ENCODING_UNSPECIFIED\x10\x00\x12\x19\n\x15PHONETIC_ENCODING_IPA\x10\x01\x12\x1d\n\x19PHONETIC_ENCODING_X_SAMPA\x10\x02\x42\t\n\x07_phraseB\x14\n\x12_phonetic_encodingB\x10\n\x0e_pronunciation\"g\n\x14\x43ustomPronunciations\x12O\n\x0epronunciations\x18\x01 
\x03(\x0b\x32\x37.google.cloud.texttospeech.v1.CustomPronunciationParams\"\x98\x01\n\x0eSynthesisInput\x12\x0e\n\x04text\x18\x01 \x01(\tH\x00\x12\x0e\n\x04ssml\x18\x02 \x01(\tH\x00\x12V\n\x15\x63ustom_pronunciations\x18\x03 \x01(\x0b\x32\x32.google.cloud.texttospeech.v1.CustomPronunciationsB\x03\xe0\x41\x01\x42\x0e\n\x0cinput_source\"\xcb\x01\n\x14VoiceSelectionParams\x12\x1a\n\rlanguage_code\x18\x01 \x01(\tB\x03\xe0\x41\x02\x12\x0c\n\x04name\x18\x02 \x01(\t\x12\x42\n\x0bssml_gender\x18\x03 \x01(\x0e\x32-.google.cloud.texttospeech.v1.SsmlVoiceGender\x12\x45\n\x0c\x63ustom_voice\x18\x04 \x01(\x0b\x32/.google.cloud.texttospeech.v1.CustomVoiceParams\"\xf1\x01\n\x0b\x41udioConfig\x12H\n\x0e\x61udio_encoding\x18\x01 \x01(\x0e\x32+.google.cloud.texttospeech.v1.AudioEncodingB\x03\xe0\x41\x02\x12\x1d\n\rspeaking_rate\x18\x02 \x01(\x01\x42\x06\xe0\x41\x04\xe0\x41\x01\x12\x15\n\x05pitch\x18\x03 \x01(\x01\x42\x06\xe0\x41\x04\xe0\x41\x01\x12\x1e\n\x0evolume_gain_db\x18\x04 \x01(\x01\x42\x06\xe0\x41\x04\xe0\x41\x01\x12\x1e\n\x11sample_rate_hertz\x18\x05 \x01(\x05\x42\x03\xe0\x41\x01\x12\"\n\x12\x65\x66\x66\x65\x63ts_profile_id\x18\x06 \x03(\tB\x06\xe0\x41\x04\xe0\x41\x01\"\xf1\x01\n\x11\x43ustomVoiceParams\x12\x32\n\x05model\x18\x01 \x01(\tB#\xe0\x41\x02\xfa\x41\x1d\n\x1b\x61utoml.googleapis.com/Model\x12\\\n\x0ereported_usage\x18\x03 \x01(\x0e\x32=.google.cloud.texttospeech.v1.CustomVoiceParams.ReportedUsageB\x05\x18\x01\xe0\x41\x01\"J\n\rReportedUsage\x12\x1e\n\x1aREPORTED_USAGE_UNSPECIFIED\x10\x00\x12\x0c\n\x08REALTIME\x10\x01\x12\x0b\n\x07OFFLINE\x10\x02\"1\n\x18SynthesizeSpeechResponse\x12\x15\n\raudio_content\x18\x01 \x01(\x0c\"c\n\x19StreamingSynthesizeConfig\x12\x46\n\x05voice\x18\x01 \x01(\x0b\x32\x32.google.cloud.texttospeech.v1.VoiceSelectionParamsB\x03\xe0\x41\x02\"9\n\x17StreamingSynthesisInput\x12\x0e\n\x04text\x18\x01 \x01(\tH\x00\x42\x0e\n\x0cinput_source\"\xce\x01\n\x1aStreamingSynthesizeRequest\x12S\n\x10streaming_config\x18\x01 
\x01(\x0b\x32\x37.google.cloud.texttospeech.v1.StreamingSynthesizeConfigH\x00\x12\x46\n\x05input\x18\x02 \x01(\x0b\x32\x35.google.cloud.texttospeech.v1.StreamingSynthesisInputH\x00\x42\x13\n\x11streaming_request\"4\n\x1bStreamingSynthesizeResponse\x12\x15\n\raudio_content\x18\x01 \x01(\x0c*W\n\x0fSsmlVoiceGender\x12!\n\x1dSSML_VOICE_GENDER_UNSPECIFIED\x10\x00\x12\x08\n\x04MALE\x10\x01\x12\n\n\x06\x46\x45MALE\x10\x02\x12\x0b\n\x07NEUTRAL\x10\x03*i\n\rAudioEncoding\x12\x1e\n\x1a\x41UDIO_ENCODING_UNSPECIFIED\x10\x00\x12\x0c\n\x08LINEAR16\x10\x01\x12\x07\n\x03MP3\x10\x02\x12\x0c\n\x08OGG_OPUS\x10\x03\x12\t\n\x05MULAW\x10\x05\x12\x08\n\x04\x41LAW\x10\x06\x32\xc7\x04\n\x0cTextToSpeech\x12\x93\x01\n\nListVoices\x12/.google.cloud.texttospeech.v1.ListVoicesRequest\x1a\x30.google.cloud.texttospeech.v1.ListVoicesResponse\"\"\xda\x41\rlanguage_code\x82\xd3\xe4\x93\x02\x0c\x12\n/v1/voices\x12\xbc\x01\n\x10SynthesizeSpeech\x12\x35.google.cloud.texttospeech.v1.SynthesizeSpeechRequest\x1a\x36.google.cloud.texttospeech.v1.SynthesizeSpeechResponse\"9\xda\x41\x18input,voice,audio_config\x82\xd3\xe4\x93\x02\x18\"\x13/v1/text:synthesize:\x01*\x12\x90\x01\n\x13StreamingSynthesize\x12\x38.google.cloud.texttospeech.v1.StreamingSynthesizeRequest\x1a\x39.google.cloud.texttospeech.v1.StreamingSynthesizeResponse\"\x00(\x01\x30\x01\x1aO\xca\x41\x1btexttospeech.googleapis.com\xd2\x41.https://www.googleapis.com/auth/cloud-platformB\xbf\x02\n com.google.cloud.texttospeech.v1B\x11TextToSpeechProtoP\x01ZDcloud.google.com/go/texttospeech/apiv1/texttospeechpb;texttospeechpb\xf8\x01\x01\xa2\x02\x04\x43TTS\xaa\x02\x1cGoogle.Cloud.TextToSpeech.V1\xca\x02\x1cGoogle\\Cloud\\TextToSpeech\\V1\xea\x02\x1fGoogle::Cloud::TextToSpeech::V1\xea\x41U\n\x1b\x61utoml.googleapis.com/Model\x12\x36projects/{project}/locations/{location}/models/{model}b\x06proto3"
|
14
14
|
|
15
15
|
pool = Google::Protobuf::DescriptorPool.generated_pool
|
16
16
|
|
@@ -43,7 +43,11 @@ module Google
|
|
43
43
|
ListVoicesRequest = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.texttospeech.v1.ListVoicesRequest").msgclass
|
44
44
|
ListVoicesResponse = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.texttospeech.v1.ListVoicesResponse").msgclass
|
45
45
|
Voice = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.texttospeech.v1.Voice").msgclass
|
46
|
+
AdvancedVoiceOptions = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.texttospeech.v1.AdvancedVoiceOptions").msgclass
|
46
47
|
SynthesizeSpeechRequest = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.texttospeech.v1.SynthesizeSpeechRequest").msgclass
|
48
|
+
CustomPronunciationParams = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.texttospeech.v1.CustomPronunciationParams").msgclass
|
49
|
+
CustomPronunciationParams::PhoneticEncoding = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.texttospeech.v1.CustomPronunciationParams.PhoneticEncoding").enummodule
|
50
|
+
CustomPronunciations = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.texttospeech.v1.CustomPronunciations").msgclass
|
47
51
|
SynthesisInput = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.texttospeech.v1.SynthesisInput").msgclass
|
48
52
|
VoiceSelectionParams = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.texttospeech.v1.VoiceSelectionParams").msgclass
|
49
53
|
AudioConfig = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.texttospeech.v1.AudioConfig").msgclass
|
@@ -66,6 +66,16 @@ module Google
|
|
66
66
|
extend ::Google::Protobuf::MessageExts::ClassMethods
|
67
67
|
end
|
68
68
|
|
69
|
+
# Used for advanced voice options.
|
70
|
+
# @!attribute [rw] low_latency_journey_synthesis
|
71
|
+
# @return [::Boolean]
|
72
|
+
# Only for Journey voices. If false, the synthesis will be context aware
|
73
|
+
# and have higher latency.
|
74
|
+
class AdvancedVoiceOptions
|
75
|
+
include ::Google::Protobuf::MessageExts
|
76
|
+
extend ::Google::Protobuf::MessageExts::ClassMethods
|
77
|
+
end
|
78
|
+
|
69
79
|
# The top-level message sent by the client for the `SynthesizeSpeech` method.
|
70
80
|
# @!attribute [rw] input
|
71
81
|
# @return [::Google::Cloud::TextToSpeech::V1::SynthesisInput]
|
@@ -76,11 +86,55 @@ module Google
|
|
76
86
|
# @!attribute [rw] audio_config
|
77
87
|
# @return [::Google::Cloud::TextToSpeech::V1::AudioConfig]
|
78
88
|
# Required. The configuration of the synthesized audio.
|
89
|
+
# @!attribute [rw] advanced_voice_options
|
90
|
+
# @return [::Google::Cloud::TextToSpeech::V1::AdvancedVoiceOptions]
|
91
|
+
# Advanced voice options.
|
79
92
|
class SynthesizeSpeechRequest
|
80
93
|
include ::Google::Protobuf::MessageExts
|
81
94
|
extend ::Google::Protobuf::MessageExts::ClassMethods
|
82
95
|
end
|
83
96
|
|
97
|
+
# Pronunciation customization for a phrase.
|
98
|
+
# @!attribute [rw] phrase
|
99
|
+
# @return [::String]
|
100
|
+
# The phrase to which the customization will be applied.
|
101
|
+
# The phrase can be multiple words (in the case of proper nouns etc), but
|
102
|
+
# should not span to a whole sentence.
|
103
|
+
# @!attribute [rw] phonetic_encoding
|
104
|
+
# @return [::Google::Cloud::TextToSpeech::V1::CustomPronunciationParams::PhoneticEncoding]
|
105
|
+
# The phonetic encoding of the phrase.
|
106
|
+
# @!attribute [rw] pronunciation
|
107
|
+
# @return [::String]
|
108
|
+
# The pronunciation of the phrase. This must be in the phonetic encoding
|
109
|
+
# specified above.
|
110
|
+
class CustomPronunciationParams
|
111
|
+
include ::Google::Protobuf::MessageExts
|
112
|
+
extend ::Google::Protobuf::MessageExts::ClassMethods
|
113
|
+
|
114
|
+
# The phonetic encoding of the phrase.
|
115
|
+
module PhoneticEncoding
|
116
|
+
# Not specified.
|
117
|
+
PHONETIC_ENCODING_UNSPECIFIED = 0
|
118
|
+
|
119
|
+
# IPA. (e.g. apple -> ˈæpəl )
|
120
|
+
# https://en.wikipedia.org/wiki/International_Phonetic_Alphabet
|
121
|
+
PHONETIC_ENCODING_IPA = 1
|
122
|
+
|
123
|
+
# X-SAMPA (e.g. apple -> "{p@l" )
|
124
|
+
# https://en.wikipedia.org/wiki/X-SAMPA
|
125
|
+
PHONETIC_ENCODING_X_SAMPA = 2
|
126
|
+
end
|
127
|
+
end
|
128
|
+
|
129
|
+
# A collection of pronunciation customizations.
|
130
|
+
# @!attribute [rw] pronunciations
|
131
|
+
# @return [::Array<::Google::Cloud::TextToSpeech::V1::CustomPronunciationParams>]
|
132
|
+
# The pronunciation customizations to be applied.
|
133
|
+
class CustomPronunciations
|
134
|
+
include ::Google::Protobuf::MessageExts
|
135
|
+
extend ::Google::Protobuf::MessageExts::ClassMethods
|
136
|
+
end
|
137
|
+
|
84
138
|
# Contains text input to be synthesized. Either `text` or `ssml` must be
|
85
139
|
# supplied. Supplying both or neither returns
|
86
140
|
# [google.rpc.Code.INVALID_ARGUMENT][google.rpc.Code.INVALID_ARGUMENT]. The
|
@@ -95,6 +149,20 @@ module Google
|
|
95
149
|
# [google.rpc.Code.INVALID_ARGUMENT][google.rpc.Code.INVALID_ARGUMENT]. For
|
96
150
|
# more information, see
|
97
151
|
# [SSML](https://cloud.google.com/text-to-speech/docs/ssml).
|
152
|
+
# @!attribute [rw] custom_pronunciations
|
153
|
+
# @return [::Google::Cloud::TextToSpeech::V1::CustomPronunciations]
|
154
|
+
# Optional. The pronunciation customizations to be applied to the input. If
|
155
|
+
# this is set, the input will be synthesized using the given pronunciation
|
156
|
+
# customizations.
|
157
|
+
#
|
158
|
+
# The initial support will be for EFIGS (English, French,
|
159
|
+
# Italian, German, Spanish) languages, as provided in
|
160
|
+
# VoiceSelectionParams. Journey and Instant Clone voices are
|
161
|
+
# not supported yet.
|
162
|
+
#
|
163
|
+
# In order to customize the pronunciation of a phrase, there must be an exact
|
164
|
+
# match of the phrase in the input types. If using SSML, the phrase must not
|
165
|
+
# be inside a phoneme tag (entirely or partially).
|
98
166
|
class SynthesisInput
|
99
167
|
include ::Google::Protobuf::MessageExts
|
100
168
|
extend ::Google::Protobuf::MessageExts::ClassMethods
|
metadata
CHANGED
@@ -1,14 +1,14 @@
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
2
2
|
name: google-cloud-text_to_speech-v1
|
3
3
|
version: !ruby/object:Gem::Version
|
4
|
-
version: 1.1.1
|
4
|
+
version: 1.2.0
|
5
5
|
platform: ruby
|
6
6
|
authors:
|
7
7
|
- Google LLC
|
8
8
|
autorequire:
|
9
9
|
bindir: bin
|
10
10
|
cert_chain: []
|
11
|
-
date: 2024-
|
11
|
+
date: 2024-10-15 00:00:00.000000000 Z
|
12
12
|
dependencies:
|
13
13
|
- !ruby/object:Gem::Dependency
|
14
14
|
name: gapic-common
|
@@ -114,7 +114,7 @@ required_rubygems_version: !ruby/object:Gem::Requirement
|
|
114
114
|
- !ruby/object:Gem::Version
|
115
115
|
version: '0'
|
116
116
|
requirements: []
|
117
|
-
rubygems_version: 3.5.
|
117
|
+
rubygems_version: 3.5.21
|
118
118
|
signing_key:
|
119
119
|
specification_version: 4
|
120
120
|
summary: Synthesizes natural-sounding speech by applying powerful neural network models.
|