google-cloud-text_to_speech-v1 1.1.1 → 1.2.0
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +4 -4
- data/lib/google/cloud/text_to_speech/v1/text_to_speech/client.rb +3 -1
- data/lib/google/cloud/text_to_speech/v1/text_to_speech/rest/client.rb +3 -1
- data/lib/google/cloud/text_to_speech/v1/version.rb +1 -1
- data/lib/google/cloud/texttospeech/v1/cloud_tts_pb.rb +5 -1
- data/proto_docs/google/cloud/texttospeech/v1/cloud_tts.rb +68 -0
- metadata +3 -3
checksums.yaml
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
---
|
2
2
|
SHA256:
|
3
|
-
metadata.gz:
|
4
|
-
data.tar.gz:
|
3
|
+
metadata.gz: fb48791dcea870341c721fee7fe39e36697dd0467219c8d544b58a0a37d4d14e
|
4
|
+
data.tar.gz: 968a0a33b6c1674b4081217033be2233ed32434757ac2c7ecd760ebab54d6aa4
|
5
5
|
SHA512:
|
6
|
-
metadata.gz:
|
7
|
-
data.tar.gz:
|
6
|
+
metadata.gz: 692b8f1eb891d7665b3b2e92e69512eb25befc2afe718a3ca9b59359b2dc805347e66e283457f6fe508bc5266a124cc5a36f5ecbe1820cdf4c5358f1aee93f5d
|
7
|
+
data.tar.gz: 8188dc4151a2c54963a76d86f4e5c0d41d65a57afc1b10a0e26e7832c73d2b18c975a4c274866406de3c3714e4c98382df295a7733beb36a2e41a117000fea24
|
data/lib/google/cloud/text_to_speech/v1/text_to_speech/client.rb
CHANGED
@@ -267,7 +267,7 @@ module Google
|
|
267
267
|
# @param options [::Gapic::CallOptions, ::Hash]
|
268
268
|
# Overrides the default settings for this call, e.g, timeout, retries, etc. Optional.
|
269
269
|
#
|
270
|
-
# @overload synthesize_speech(input: nil, voice: nil, audio_config: nil)
|
270
|
+
# @overload synthesize_speech(input: nil, voice: nil, audio_config: nil, advanced_voice_options: nil)
|
271
271
|
# Pass arguments to `synthesize_speech` via keyword arguments. Note that at
|
272
272
|
# least one keyword argument is required. To specify no parameters, or to keep all
|
273
273
|
# the default parameter values, pass an empty Hash as a request object (see above).
|
@@ -278,6 +278,8 @@ module Google
|
|
278
278
|
# Required. The desired voice of the synthesized audio.
|
279
279
|
# @param audio_config [::Google::Cloud::TextToSpeech::V1::AudioConfig, ::Hash]
|
280
280
|
# Required. The configuration of the synthesized audio.
|
281
|
+
# @param advanced_voice_options [::Google::Cloud::TextToSpeech::V1::AdvancedVoiceOptions, ::Hash]
|
282
|
+
# Advanced voice options.
|
281
283
|
#
|
282
284
|
# @yield [response, operation] Access the result along with the RPC operation
|
283
285
|
# @yieldparam response [::Google::Cloud::TextToSpeech::V1::SynthesizeSpeechResponse]
|
data/lib/google/cloud/text_to_speech/v1/text_to_speech/rest/client.rb
CHANGED
@@ -261,7 +261,7 @@ module Google
|
|
261
261
|
# @param options [::Gapic::CallOptions, ::Hash]
|
262
262
|
# Overrides the default settings for this call, e.g, timeout, retries etc. Optional.
|
263
263
|
#
|
264
|
-
# @overload synthesize_speech(input: nil, voice: nil, audio_config: nil)
|
264
|
+
# @overload synthesize_speech(input: nil, voice: nil, audio_config: nil, advanced_voice_options: nil)
|
265
265
|
# Pass arguments to `synthesize_speech` via keyword arguments. Note that at
|
266
266
|
# least one keyword argument is required. To specify no parameters, or to keep all
|
267
267
|
# the default parameter values, pass an empty Hash as a request object (see above).
|
@@ -272,6 +272,8 @@ module Google
|
|
272
272
|
# Required. The desired voice of the synthesized audio.
|
273
273
|
# @param audio_config [::Google::Cloud::TextToSpeech::V1::AudioConfig, ::Hash]
|
274
274
|
# Required. The configuration of the synthesized audio.
|
275
|
+
# @param advanced_voice_options [::Google::Cloud::TextToSpeech::V1::AdvancedVoiceOptions, ::Hash]
|
276
|
+
# Advanced voice options.
|
275
277
|
# @yield [result, operation] Access the result along with the TransportOperation object
|
276
278
|
# @yieldparam result [::Google::Cloud::TextToSpeech::V1::SynthesizeSpeechResponse]
|
277
279
|
# @yieldparam operation [::Gapic::Rest::TransportOperation]
|
data/lib/google/cloud/texttospeech/v1/cloud_tts_pb.rb
CHANGED
@@ -10,7 +10,7 @@ require 'google/api/field_behavior_pb'
|
|
10
10
|
require 'google/api/resource_pb'
|
11
11
|
|
12
12
|
|
13
|
-
descriptor_data = "\n,google/cloud/texttospeech/v1/cloud_tts.proto\x12\x1cgoogle.cloud.texttospeech.v1\x1a\x1cgoogle/api/annotations.proto\x1a\x17google/api/client.proto\x1a\x1fgoogle/api/field_behavior.proto\x1a\x19google/api/resource.proto\"/\n\x11ListVoicesRequest\x12\x1a\n\rlanguage_code\x18\x01 \x01(\tB\x03\xe0\x41\x01\"I\n\x12ListVoicesResponse\x12\x33\n\x06voices\x18\x01 \x03(\x0b\x32#.google.cloud.texttospeech.v1.Voice\"\x94\x01\n\x05Voice\x12\x16\n\x0elanguage_codes\x18\x01 \x03(\t\x12\x0c\n\x04name\x18\x02 \x01(\t\x12\x42\n\x0bssml_gender\x18\x03 \x01(\x0e\x32-.google.cloud.texttospeech.v1.SsmlVoiceGender\x12!\n\x19natural_sample_rate_hertz\x18\x04 \x01(\x05\"\
|
13
|
+
descriptor_data = "\n,google/cloud/texttospeech/v1/cloud_tts.proto\x12\x1cgoogle.cloud.texttospeech.v1\x1a\x1cgoogle/api/annotations.proto\x1a\x17google/api/client.proto\x1a\x1fgoogle/api/field_behavior.proto\x1a\x19google/api/resource.proto\"/\n\x11ListVoicesRequest\x12\x1a\n\rlanguage_code\x18\x01 \x01(\tB\x03\xe0\x41\x01\"I\n\x12ListVoicesResponse\x12\x33\n\x06voices\x18\x01 \x03(\x0b\x32#.google.cloud.texttospeech.v1.Voice\"\x94\x01\n\x05Voice\x12\x16\n\x0elanguage_codes\x18\x01 \x03(\t\x12\x0c\n\x04name\x18\x02 \x01(\t\x12\x42\n\x0bssml_gender\x18\x03 \x01(\x0e\x32-.google.cloud.texttospeech.v1.SsmlVoiceGender\x12!\n\x19natural_sample_rate_hertz\x18\x04 \x01(\x05\"d\n\x14\x41\x64vancedVoiceOptions\x12*\n\x1dlow_latency_journey_synthesis\x18\x01 \x01(\x08H\x00\x88\x01\x01\x42 \n\x1e_low_latency_journey_synthesis\"\xdd\x02\n\x17SynthesizeSpeechRequest\x12@\n\x05input\x18\x01 \x01(\x0b\x32,.google.cloud.texttospeech.v1.SynthesisInputB\x03\xe0\x41\x02\x12\x46\n\x05voice\x18\x02 \x01(\x0b\x32\x32.google.cloud.texttospeech.v1.VoiceSelectionParamsB\x03\xe0\x41\x02\x12\x44\n\x0c\x61udio_config\x18\x03 \x01(\x0b\x32).google.cloud.texttospeech.v1.AudioConfigB\x03\xe0\x41\x02\x12W\n\x16\x61\x64vanced_voice_options\x18\x08 \x01(\x0b\x32\x32.google.cloud.texttospeech.v1.AdvancedVoiceOptionsH\x00\x88\x01\x01\x42\x19\n\x17_advanced_voice_options\"\xda\x02\n\x19\x43ustomPronunciationParams\x12\x13\n\x06phrase\x18\x01 \x01(\tH\x00\x88\x01\x01\x12h\n\x11phonetic_encoding\x18\x02 \x01(\x0e\x32H.google.cloud.texttospeech.v1.CustomPronunciationParams.PhoneticEncodingH\x01\x88\x01\x01\x12\x1a\n\rpronunciation\x18\x03 \x01(\tH\x02\x88\x01\x01\"o\n\x10PhoneticEncoding\x12!\n\x1dPHONETIC_ENCODING_UNSPECIFIED\x10\x00\x12\x19\n\x15PHONETIC_ENCODING_IPA\x10\x01\x12\x1d\n\x19PHONETIC_ENCODING_X_SAMPA\x10\x02\x42\t\n\x07_phraseB\x14\n\x12_phonetic_encodingB\x10\n\x0e_pronunciation\"g\n\x14\x43ustomPronunciations\x12O\n\x0epronunciations\x18\x01 
\x03(\x0b\x32\x37.google.cloud.texttospeech.v1.CustomPronunciationParams\"\x98\x01\n\x0eSynthesisInput\x12\x0e\n\x04text\x18\x01 \x01(\tH\x00\x12\x0e\n\x04ssml\x18\x02 \x01(\tH\x00\x12V\n\x15\x63ustom_pronunciations\x18\x03 \x01(\x0b\x32\x32.google.cloud.texttospeech.v1.CustomPronunciationsB\x03\xe0\x41\x01\x42\x0e\n\x0cinput_source\"\xcb\x01\n\x14VoiceSelectionParams\x12\x1a\n\rlanguage_code\x18\x01 \x01(\tB\x03\xe0\x41\x02\x12\x0c\n\x04name\x18\x02 \x01(\t\x12\x42\n\x0bssml_gender\x18\x03 \x01(\x0e\x32-.google.cloud.texttospeech.v1.SsmlVoiceGender\x12\x45\n\x0c\x63ustom_voice\x18\x04 \x01(\x0b\x32/.google.cloud.texttospeech.v1.CustomVoiceParams\"\xf1\x01\n\x0b\x41udioConfig\x12H\n\x0e\x61udio_encoding\x18\x01 \x01(\x0e\x32+.google.cloud.texttospeech.v1.AudioEncodingB\x03\xe0\x41\x02\x12\x1d\n\rspeaking_rate\x18\x02 \x01(\x01\x42\x06\xe0\x41\x04\xe0\x41\x01\x12\x15\n\x05pitch\x18\x03 \x01(\x01\x42\x06\xe0\x41\x04\xe0\x41\x01\x12\x1e\n\x0evolume_gain_db\x18\x04 \x01(\x01\x42\x06\xe0\x41\x04\xe0\x41\x01\x12\x1e\n\x11sample_rate_hertz\x18\x05 \x01(\x05\x42\x03\xe0\x41\x01\x12\"\n\x12\x65\x66\x66\x65\x63ts_profile_id\x18\x06 \x03(\tB\x06\xe0\x41\x04\xe0\x41\x01\"\xf1\x01\n\x11\x43ustomVoiceParams\x12\x32\n\x05model\x18\x01 \x01(\tB#\xe0\x41\x02\xfa\x41\x1d\n\x1b\x61utoml.googleapis.com/Model\x12\\\n\x0ereported_usage\x18\x03 \x01(\x0e\x32=.google.cloud.texttospeech.v1.CustomVoiceParams.ReportedUsageB\x05\x18\x01\xe0\x41\x01\"J\n\rReportedUsage\x12\x1e\n\x1aREPORTED_USAGE_UNSPECIFIED\x10\x00\x12\x0c\n\x08REALTIME\x10\x01\x12\x0b\n\x07OFFLINE\x10\x02\"1\n\x18SynthesizeSpeechResponse\x12\x15\n\raudio_content\x18\x01 \x01(\x0c\"c\n\x19StreamingSynthesizeConfig\x12\x46\n\x05voice\x18\x01 \x01(\x0b\x32\x32.google.cloud.texttospeech.v1.VoiceSelectionParamsB\x03\xe0\x41\x02\"9\n\x17StreamingSynthesisInput\x12\x0e\n\x04text\x18\x01 \x01(\tH\x00\x42\x0e\n\x0cinput_source\"\xce\x01\n\x1aStreamingSynthesizeRequest\x12S\n\x10streaming_config\x18\x01 
\x01(\x0b\x32\x37.google.cloud.texttospeech.v1.StreamingSynthesizeConfigH\x00\x12\x46\n\x05input\x18\x02 \x01(\x0b\x32\x35.google.cloud.texttospeech.v1.StreamingSynthesisInputH\x00\x42\x13\n\x11streaming_request\"4\n\x1bStreamingSynthesizeResponse\x12\x15\n\raudio_content\x18\x01 \x01(\x0c*W\n\x0fSsmlVoiceGender\x12!\n\x1dSSML_VOICE_GENDER_UNSPECIFIED\x10\x00\x12\x08\n\x04MALE\x10\x01\x12\n\n\x06\x46\x45MALE\x10\x02\x12\x0b\n\x07NEUTRAL\x10\x03*i\n\rAudioEncoding\x12\x1e\n\x1a\x41UDIO_ENCODING_UNSPECIFIED\x10\x00\x12\x0c\n\x08LINEAR16\x10\x01\x12\x07\n\x03MP3\x10\x02\x12\x0c\n\x08OGG_OPUS\x10\x03\x12\t\n\x05MULAW\x10\x05\x12\x08\n\x04\x41LAW\x10\x06\x32\xc7\x04\n\x0cTextToSpeech\x12\x93\x01\n\nListVoices\x12/.google.cloud.texttospeech.v1.ListVoicesRequest\x1a\x30.google.cloud.texttospeech.v1.ListVoicesResponse\"\"\xda\x41\rlanguage_code\x82\xd3\xe4\x93\x02\x0c\x12\n/v1/voices\x12\xbc\x01\n\x10SynthesizeSpeech\x12\x35.google.cloud.texttospeech.v1.SynthesizeSpeechRequest\x1a\x36.google.cloud.texttospeech.v1.SynthesizeSpeechResponse\"9\xda\x41\x18input,voice,audio_config\x82\xd3\xe4\x93\x02\x18\"\x13/v1/text:synthesize:\x01*\x12\x90\x01\n\x13StreamingSynthesize\x12\x38.google.cloud.texttospeech.v1.StreamingSynthesizeRequest\x1a\x39.google.cloud.texttospeech.v1.StreamingSynthesizeResponse\"\x00(\x01\x30\x01\x1aO\xca\x41\x1btexttospeech.googleapis.com\xd2\x41.https://www.googleapis.com/auth/cloud-platformB\xbf\x02\n com.google.cloud.texttospeech.v1B\x11TextToSpeechProtoP\x01ZDcloud.google.com/go/texttospeech/apiv1/texttospeechpb;texttospeechpb\xf8\x01\x01\xa2\x02\x04\x43TTS\xaa\x02\x1cGoogle.Cloud.TextToSpeech.V1\xca\x02\x1cGoogle\\Cloud\\TextToSpeech\\V1\xea\x02\x1fGoogle::Cloud::TextToSpeech::V1\xea\x41U\n\x1b\x61utoml.googleapis.com/Model\x12\x36projects/{project}/locations/{location}/models/{model}b\x06proto3"
|
14
14
|
|
15
15
|
pool = Google::Protobuf::DescriptorPool.generated_pool
|
16
16
|
|
@@ -43,7 +43,11 @@ module Google
|
|
43
43
|
ListVoicesRequest = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.texttospeech.v1.ListVoicesRequest").msgclass
|
44
44
|
ListVoicesResponse = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.texttospeech.v1.ListVoicesResponse").msgclass
|
45
45
|
Voice = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.texttospeech.v1.Voice").msgclass
|
46
|
+
AdvancedVoiceOptions = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.texttospeech.v1.AdvancedVoiceOptions").msgclass
|
46
47
|
SynthesizeSpeechRequest = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.texttospeech.v1.SynthesizeSpeechRequest").msgclass
|
48
|
+
CustomPronunciationParams = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.texttospeech.v1.CustomPronunciationParams").msgclass
|
49
|
+
CustomPronunciationParams::PhoneticEncoding = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.texttospeech.v1.CustomPronunciationParams.PhoneticEncoding").enummodule
|
50
|
+
CustomPronunciations = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.texttospeech.v1.CustomPronunciations").msgclass
|
47
51
|
SynthesisInput = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.texttospeech.v1.SynthesisInput").msgclass
|
48
52
|
VoiceSelectionParams = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.texttospeech.v1.VoiceSelectionParams").msgclass
|
49
53
|
AudioConfig = ::Google::Protobuf::DescriptorPool.generated_pool.lookup("google.cloud.texttospeech.v1.AudioConfig").msgclass
|
data/proto_docs/google/cloud/texttospeech/v1/cloud_tts.rb
CHANGED
@@ -66,6 +66,16 @@ module Google
|
|
66
66
|
extend ::Google::Protobuf::MessageExts::ClassMethods
|
67
67
|
end
|
68
68
|
|
69
|
+
# Used for advanced voice options.
|
70
|
+
# @!attribute [rw] low_latency_journey_synthesis
|
71
|
+
# @return [::Boolean]
|
72
|
+
# Only for Journey voices. If false, the synthesis will be context aware
|
73
|
+
# and have higher latency.
|
74
|
+
class AdvancedVoiceOptions
|
75
|
+
include ::Google::Protobuf::MessageExts
|
76
|
+
extend ::Google::Protobuf::MessageExts::ClassMethods
|
77
|
+
end
|
78
|
+
|
69
79
|
# The top-level message sent by the client for the `SynthesizeSpeech` method.
|
70
80
|
# @!attribute [rw] input
|
71
81
|
# @return [::Google::Cloud::TextToSpeech::V1::SynthesisInput]
|
@@ -76,11 +86,55 @@ module Google
|
|
76
86
|
# @!attribute [rw] audio_config
|
77
87
|
# @return [::Google::Cloud::TextToSpeech::V1::AudioConfig]
|
78
88
|
# Required. The configuration of the synthesized audio.
|
89
|
+
# @!attribute [rw] advanced_voice_options
|
90
|
+
# @return [::Google::Cloud::TextToSpeech::V1::AdvancedVoiceOptions]
|
91
|
+
# Advanced voice options.
|
79
92
|
class SynthesizeSpeechRequest
|
80
93
|
include ::Google::Protobuf::MessageExts
|
81
94
|
extend ::Google::Protobuf::MessageExts::ClassMethods
|
82
95
|
end
|
83
96
|
|
97
|
+
# Pronunciation customization for a phrase.
|
98
|
+
# @!attribute [rw] phrase
|
99
|
+
# @return [::String]
|
100
|
+
# The phrase to which the customization will be applied.
|
101
|
+
# The phrase can be multiple words (in the case of proper nouns etc), but
|
102
|
+
# should not span to a whole sentence.
|
103
|
+
# @!attribute [rw] phonetic_encoding
|
104
|
+
# @return [::Google::Cloud::TextToSpeech::V1::CustomPronunciationParams::PhoneticEncoding]
|
105
|
+
# The phonetic encoding of the phrase.
|
106
|
+
# @!attribute [rw] pronunciation
|
107
|
+
# @return [::String]
|
108
|
+
# The pronunciation of the phrase. This must be in the phonetic encoding
|
109
|
+
# specified above.
|
110
|
+
class CustomPronunciationParams
|
111
|
+
include ::Google::Protobuf::MessageExts
|
112
|
+
extend ::Google::Protobuf::MessageExts::ClassMethods
|
113
|
+
|
114
|
+
# The phonetic encoding of the phrase.
|
115
|
+
module PhoneticEncoding
|
116
|
+
# Not specified.
|
117
|
+
PHONETIC_ENCODING_UNSPECIFIED = 0
|
118
|
+
|
119
|
+
# IPA. (e.g. apple -> ˈæpəl )
|
120
|
+
# https://en.wikipedia.org/wiki/International_Phonetic_Alphabet
|
121
|
+
PHONETIC_ENCODING_IPA = 1
|
122
|
+
|
123
|
+
# X-SAMPA (e.g. apple -> "{p@l" )
|
124
|
+
# https://en.wikipedia.org/wiki/X-SAMPA
|
125
|
+
PHONETIC_ENCODING_X_SAMPA = 2
|
126
|
+
end
|
127
|
+
end
|
128
|
+
|
129
|
+
# A collection of pronunciation customizations.
|
130
|
+
# @!attribute [rw] pronunciations
|
131
|
+
# @return [::Array<::Google::Cloud::TextToSpeech::V1::CustomPronunciationParams>]
|
132
|
+
# The pronunciation customizations to be applied.
|
133
|
+
class CustomPronunciations
|
134
|
+
include ::Google::Protobuf::MessageExts
|
135
|
+
extend ::Google::Protobuf::MessageExts::ClassMethods
|
136
|
+
end
|
137
|
+
|
84
138
|
# Contains text input to be synthesized. Either `text` or `ssml` must be
|
85
139
|
# supplied. Supplying both or neither returns
|
86
140
|
# [google.rpc.Code.INVALID_ARGUMENT][google.rpc.Code.INVALID_ARGUMENT]. The
|
@@ -95,6 +149,20 @@ module Google
|
|
95
149
|
# [google.rpc.Code.INVALID_ARGUMENT][google.rpc.Code.INVALID_ARGUMENT]. For
|
96
150
|
# more information, see
|
97
151
|
# [SSML](https://cloud.google.com/text-to-speech/docs/ssml).
|
152
|
+
# @!attribute [rw] custom_pronunciations
|
153
|
+
# @return [::Google::Cloud::TextToSpeech::V1::CustomPronunciations]
|
154
|
+
# Optional. The pronunciation customizations to be applied to the input. If
|
155
|
+
# this is set, the input will be synthesized using the given pronunciation
|
156
|
+
# customizations.
|
157
|
+
#
|
158
|
+
# The initial support will be for EFIGS (English, French,
|
159
|
+
# Italian, German, Spanish) languages, as provided in
|
160
|
+
# VoiceSelectionParams. Journey and Instant Clone voices are
|
161
|
+
# not supported yet.
|
162
|
+
#
|
163
|
+
# In order to customize the pronunciation of a phrase, there must be an exact
|
164
|
+
# match of the phrase in the input types. If using SSML, the phrase must not
|
165
|
+
# be inside a phoneme tag (entirely or partially).
|
98
166
|
class SynthesisInput
|
99
167
|
include ::Google::Protobuf::MessageExts
|
100
168
|
extend ::Google::Protobuf::MessageExts::ClassMethods
|
metadata
CHANGED
@@ -1,14 +1,14 @@
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
2
2
|
name: google-cloud-text_to_speech-v1
|
3
3
|
version: !ruby/object:Gem::Version
|
4
|
-
version: 1.1.1
|
4
|
+
version: 1.2.0
|
5
5
|
platform: ruby
|
6
6
|
authors:
|
7
7
|
- Google LLC
|
8
8
|
autorequire:
|
9
9
|
bindir: bin
|
10
10
|
cert_chain: []
|
11
|
-
date: 2024-
|
11
|
+
date: 2024-10-15 00:00:00.000000000 Z
|
12
12
|
dependencies:
|
13
13
|
- !ruby/object:Gem::Dependency
|
14
14
|
name: gapic-common
|
@@ -114,7 +114,7 @@ required_rubygems_version: !ruby/object:Gem::Requirement
|
|
114
114
|
- !ruby/object:Gem::Version
|
115
115
|
version: '0'
|
116
116
|
requirements: []
|
117
|
-
rubygems_version: 3.5.
|
117
|
+
rubygems_version: 3.5.21
|
118
118
|
signing_key:
|
119
119
|
specification_version: 4
|
120
120
|
summary: Synthesizes natural-sounding speech by applying powerful neural network models.
|