google-apis-texttospeech_v1 0.32.0 → 0.34.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
checksums.yaml CHANGED
@@ -1,7 +1,7 @@
1
1
  ---
2
2
  SHA256:
3
- metadata.gz: f700a3f8560abf9b80877dcecb6a3402a3a718101302ddc2b37f1c3b3e4e1c31
4
- data.tar.gz: 38839ecd1730441dc50849d11dd9ce97b590443ec73a8f8e90188259c3515503
3
+ metadata.gz: 881d8a76ab548234a4b3d8e52813e4a5ccc660d98c2e9761f7a7a277f6451687
4
+ data.tar.gz: 4a80b1ab02b13ff10ff8cbe5adab3e3074b5fcf36b5a3cf0f21c102e25f7d7e0
5
5
  SHA512:
6
- metadata.gz: 4ab393a0727618b3c0bc6d356a9e833e99261148861e2d2af150a4a94716ae9a23dcaaf69f46054a0b2f94c1c32b4b8882e9603192aac8dab3278479bc3dee35
7
- data.tar.gz: e0ce9aa975b440cd21cc590ab07897ecc851bc8b8e480776d83a031e1525fca62c94be8c28c41895f0c3cb4b4caf6e7c677f0ecdc67917a552f35a7fe2f15aea
6
+ metadata.gz: c86f86a081a9fb118e0be29cdba376341839ae2c5a3b2503b5c934fa4ea5b672e67aeaadea8acf1e106ea44f834d4501e91bf18b66c3516aa228f211821b737d
7
+ data.tar.gz: e061b4b5100fceaeeba6a1e95e2aee2a606272684e06a83fee6c245e947dd573aa698705b690efc01a271e2e746419bcbf2a3568c747a3fffe9d1a39ae4099ab
data/CHANGELOG.md CHANGED
@@ -1,5 +1,13 @@
1
1
  # Release history for google-apis-texttospeech_v1
2
2
 
3
+ ### v0.34.0 (2024-11-03)
4
+
5
+ * Regenerated from discovery document revision 20241026
6
+
7
+ ### v0.33.0 (2024-10-20)
8
+
9
+ * Regenerated from discovery document revision 20241008
10
+
3
11
  ### v0.32.0 (2024-10-06)
4
12
 
5
13
  * Regenerated from discovery document revision 20241001
@@ -26,7 +26,7 @@ module Google
26
26
  class AdvancedVoiceOptions
27
27
  include Google::Apis::Core::Hashable
28
28
 
29
- # Only for Jounrney voices. If false, the synthesis will be context aware and
29
+ # Only for Journey voices. If false, the synthesis will be context aware and
30
30
  # have higher latency.
31
31
  # Corresponds to the JSON property `lowLatencyJourneySynthesis`
32
32
  # @return [Boolean]
@@ -221,68 +221,6 @@ module Google
221
221
  end
222
222
  end
223
223
 
224
- # Request message for the `GenerateVoiceCloningKey` method.
225
- class GenerateVoiceCloningKeyRequest
226
- include Google::Apis::Core::Hashable
227
-
228
- # Required. The script used for the voice talent statement. The script will be
229
- # provided to the caller through other channels. It must be returned unchanged
230
- # in this field.
231
- # Corresponds to the JSON property `consentScript`
232
- # @return [String]
233
- attr_accessor :consent_script
234
-
235
- # Required. The language of the supplied audio as a [BCP-47](https://www.rfc-
236
- # editor.org/rfc/bcp/bcp47.txt) language tag. Example: "en-US". See [Language
237
- # Support](https://cloud.google.com/speech-to-text/docs/languages) for a list of
238
- # the currently supported language codes.
239
- # Corresponds to the JSON property `languageCode`
240
- # @return [String]
241
- attr_accessor :language_code
242
-
243
- # Holds audio content and config.
244
- # Corresponds to the JSON property `referenceAudio`
245
- # @return [Google::Apis::TexttospeechV1::InputAudio]
246
- attr_accessor :reference_audio
247
-
248
- # Holds audio content and config.
249
- # Corresponds to the JSON property `voiceTalentConsent`
250
- # @return [Google::Apis::TexttospeechV1::InputAudio]
251
- attr_accessor :voice_talent_consent
252
-
253
- def initialize(**args)
254
- update!(**args)
255
- end
256
-
257
- # Update properties of this object
258
- def update!(**args)
259
- @consent_script = args[:consent_script] if args.key?(:consent_script)
260
- @language_code = args[:language_code] if args.key?(:language_code)
261
- @reference_audio = args[:reference_audio] if args.key?(:reference_audio)
262
- @voice_talent_consent = args[:voice_talent_consent] if args.key?(:voice_talent_consent)
263
- end
264
- end
265
-
266
- # Response message for the `GenerateVoiceCloningKey` method.
267
- class GenerateVoiceCloningKeyResponse
268
- include Google::Apis::Core::Hashable
269
-
270
- # The voice clone key. Use it in the SynthesizeSpeechRequest by setting [voice.
271
- # voice_clone.voice_cloning_key].
272
- # Corresponds to the JSON property `voiceCloningKey`
273
- # @return [String]
274
- attr_accessor :voice_cloning_key
275
-
276
- def initialize(**args)
277
- update!(**args)
278
- end
279
-
280
- # Update properties of this object
281
- def update!(**args)
282
- @voice_cloning_key = args[:voice_cloning_key] if args.key?(:voice_cloning_key)
283
- end
284
- end
285
-
286
224
  # Metadata for response returned by the `SynthesizeLongAudio` method.
287
225
  class GoogleCloudTexttospeechV1SynthesizeLongAudioMetadata
288
226
  include Google::Apis::Core::Hashable
@@ -314,60 +252,6 @@ module Google
314
252
  end
315
253
  end
316
254
 
317
- # Holds audio content and config.
318
- class InputAudio
319
- include Google::Apis::Core::Hashable
320
-
321
- # Description of inputted audio data.
322
- # Corresponds to the JSON property `audioConfig`
323
- # @return [Google::Apis::TexttospeechV1::InputAudioConfig]
324
- attr_accessor :audio_config
325
-
326
- # Required. The audio data bytes encoded as specified in `InputAudioConfig`.
327
- # Note: as with all bytes fields, proto buffers use a pure binary representation,
328
- # whereas JSON representations use base64. Audio samples should be between 5-25
329
- # seconds in length.
330
- # Corresponds to the JSON property `content`
331
- # NOTE: Values are automatically base64 encoded/decoded in the client library.
332
- # @return [String]
333
- attr_accessor :content
334
-
335
- def initialize(**args)
336
- update!(**args)
337
- end
338
-
339
- # Update properties of this object
340
- def update!(**args)
341
- @audio_config = args[:audio_config] if args.key?(:audio_config)
342
- @content = args[:content] if args.key?(:content)
343
- end
344
- end
345
-
346
- # Description of inputted audio data.
347
- class InputAudioConfig
348
- include Google::Apis::Core::Hashable
349
-
350
- # Required. The format of the audio byte stream.
351
- # Corresponds to the JSON property `audioEncoding`
352
- # @return [String]
353
- attr_accessor :audio_encoding
354
-
355
- # Required. The sample rate (in hertz) for this audio.
356
- # Corresponds to the JSON property `sampleRateHertz`
357
- # @return [Fixnum]
358
- attr_accessor :sample_rate_hertz
359
-
360
- def initialize(**args)
361
- update!(**args)
362
- end
363
-
364
- # Update properties of this object
365
- def update!(**args)
366
- @audio_encoding = args[:audio_encoding] if args.key?(:audio_encoding)
367
- @sample_rate_hertz = args[:sample_rate_hertz] if args.key?(:sample_rate_hertz)
368
- end
369
- end
370
-
371
255
  # The response message for Operations.ListOperations.
372
256
  class ListOperationsResponse
373
257
  include Google::Apis::Core::Hashable
@@ -412,6 +296,25 @@ module Google
412
296
  end
413
297
  end
414
298
 
299
+ # A collection of turns for multi-speaker synthesis.
300
+ class MultiSpeakerMarkup
301
+ include Google::Apis::Core::Hashable
302
+
303
+ # Required. Speaker turns.
304
+ # Corresponds to the JSON property `turns`
305
+ # @return [Array<Google::Apis::TexttospeechV1::Turn>]
306
+ attr_accessor :turns
307
+
308
+ def initialize(**args)
309
+ update!(**args)
310
+ end
311
+
312
+ # Update properties of this object
313
+ def update!(**args)
314
+ @turns = args[:turns] if args.key?(:turns)
315
+ end
316
+ end
317
+
415
318
  # This resource represents a long-running operation that is the result of a
416
319
  # network API call.
417
320
  class Operation
@@ -524,6 +427,11 @@ module Google
524
427
  # @return [Google::Apis::TexttospeechV1::CustomPronunciations]
525
428
  attr_accessor :custom_pronunciations
526
429
 
430
+ # A collection of turns for multi-speaker synthesis.
431
+ # Corresponds to the JSON property `multiSpeakerMarkup`
432
+ # @return [Google::Apis::TexttospeechV1::MultiSpeakerMarkup]
433
+ attr_accessor :multi_speaker_markup
434
+
527
435
  # The SSML document to be synthesized. The SSML document must be valid and well-
528
436
  # formed. Otherwise the RPC will fail and return google.rpc.Code.
529
437
  # INVALID_ARGUMENT. For more information, see [SSML](https://cloud.google.com/
@@ -544,6 +452,7 @@ module Google
544
452
  # Update properties of this object
545
453
  def update!(**args)
546
454
  @custom_pronunciations = args[:custom_pronunciations] if args.key?(:custom_pronunciations)
455
+ @multi_speaker_markup = args[:multi_speaker_markup] if args.key?(:multi_speaker_markup)
547
456
  @ssml = args[:ssml] if args.key?(:ssml)
548
457
  @text = args[:text] if args.key?(:text)
549
458
  end
@@ -684,6 +593,32 @@ module Google
684
593
  end
685
594
  end
686
595
 
596
+ # A Multi-speaker turn.
597
+ class Turn
598
+ include Google::Apis::Core::Hashable
599
+
600
+ # Required. The speaker of the turn, for example, 'O' or 'Q'. Please refer to
601
+ # documentation for available speakers.
602
+ # Corresponds to the JSON property `speaker`
603
+ # @return [String]
604
+ attr_accessor :speaker
605
+
606
+ # Required. The text to speak.
607
+ # Corresponds to the JSON property `text`
608
+ # @return [String]
609
+ attr_accessor :text
610
+
611
+ def initialize(**args)
612
+ update!(**args)
613
+ end
614
+
615
+ # Update properties of this object
616
+ def update!(**args)
617
+ @speaker = args[:speaker] if args.key?(:speaker)
618
+ @text = args[:text] if args.key?(:text)
619
+ end
620
+ end
621
+
687
622
  # Description of a voice supported by the TTS service.
688
623
  class Voice
689
624
  include Google::Apis::Core::Hashable
@@ -16,13 +16,13 @@ module Google
16
16
  module Apis
17
17
  module TexttospeechV1
18
18
  # Version of the google-apis-texttospeech_v1 gem
19
- GEM_VERSION = "0.32.0"
19
+ GEM_VERSION = "0.34.0"
20
20
 
21
21
  # Version of the code generator used to generate this client
22
22
  GENERATOR_VERSION = "0.15.1"
23
23
 
24
24
  # Revision of the discovery document this client was generated from
25
- REVISION = "20241001"
25
+ REVISION = "20241026"
26
26
  end
27
27
  end
28
28
  end
@@ -64,43 +64,25 @@ module Google
64
64
  include Google::Apis::Core::JsonObjectSupport
65
65
  end
66
66
 
67
- class GenerateVoiceCloningKeyRequest
68
- class Representation < Google::Apis::Core::JsonRepresentation; end
69
-
70
- include Google::Apis::Core::JsonObjectSupport
71
- end
72
-
73
- class GenerateVoiceCloningKeyResponse
74
- class Representation < Google::Apis::Core::JsonRepresentation; end
75
-
76
- include Google::Apis::Core::JsonObjectSupport
77
- end
78
-
79
67
  class GoogleCloudTexttospeechV1SynthesizeLongAudioMetadata
80
68
  class Representation < Google::Apis::Core::JsonRepresentation; end
81
69
 
82
70
  include Google::Apis::Core::JsonObjectSupport
83
71
  end
84
72
 
85
- class InputAudio
86
- class Representation < Google::Apis::Core::JsonRepresentation; end
87
-
88
- include Google::Apis::Core::JsonObjectSupport
89
- end
90
-
91
- class InputAudioConfig
73
+ class ListOperationsResponse
92
74
  class Representation < Google::Apis::Core::JsonRepresentation; end
93
75
 
94
76
  include Google::Apis::Core::JsonObjectSupport
95
77
  end
96
78
 
97
- class ListOperationsResponse
79
+ class ListVoicesResponse
98
80
  class Representation < Google::Apis::Core::JsonRepresentation; end
99
81
 
100
82
  include Google::Apis::Core::JsonObjectSupport
101
83
  end
102
84
 
103
- class ListVoicesResponse
85
+ class MultiSpeakerMarkup
104
86
  class Representation < Google::Apis::Core::JsonRepresentation; end
105
87
 
106
88
  include Google::Apis::Core::JsonObjectSupport
@@ -148,6 +130,12 @@ module Google
148
130
  include Google::Apis::Core::JsonObjectSupport
149
131
  end
150
132
 
133
+ class Turn
134
+ class Representation < Google::Apis::Core::JsonRepresentation; end
135
+
136
+ include Google::Apis::Core::JsonObjectSupport
137
+ end
138
+
151
139
  class Voice
152
140
  class Representation < Google::Apis::Core::JsonRepresentation; end
153
141
 
@@ -222,25 +210,6 @@ module Google
222
210
  end
223
211
  end
224
212
 
225
- class GenerateVoiceCloningKeyRequest
226
- # @private
227
- class Representation < Google::Apis::Core::JsonRepresentation
228
- property :consent_script, as: 'consentScript'
229
- property :language_code, as: 'languageCode'
230
- property :reference_audio, as: 'referenceAudio', class: Google::Apis::TexttospeechV1::InputAudio, decorator: Google::Apis::TexttospeechV1::InputAudio::Representation
231
-
232
- property :voice_talent_consent, as: 'voiceTalentConsent', class: Google::Apis::TexttospeechV1::InputAudio, decorator: Google::Apis::TexttospeechV1::InputAudio::Representation
233
-
234
- end
235
- end
236
-
237
- class GenerateVoiceCloningKeyResponse
238
- # @private
239
- class Representation < Google::Apis::Core::JsonRepresentation
240
- property :voice_cloning_key, as: 'voiceCloningKey'
241
- end
242
- end
243
-
244
213
  class GoogleCloudTexttospeechV1SynthesizeLongAudioMetadata
245
214
  # @private
246
215
  class Representation < Google::Apis::Core::JsonRepresentation
@@ -250,36 +219,27 @@ module Google
250
219
  end
251
220
  end
252
221
 
253
- class InputAudio
222
+ class ListOperationsResponse
254
223
  # @private
255
224
  class Representation < Google::Apis::Core::JsonRepresentation
256
- property :audio_config, as: 'audioConfig', class: Google::Apis::TexttospeechV1::InputAudioConfig, decorator: Google::Apis::TexttospeechV1::InputAudioConfig::Representation
225
+ property :next_page_token, as: 'nextPageToken'
226
+ collection :operations, as: 'operations', class: Google::Apis::TexttospeechV1::Operation, decorator: Google::Apis::TexttospeechV1::Operation::Representation
257
227
 
258
- property :content, :base64 => true, as: 'content'
259
228
  end
260
229
  end
261
230
 
262
- class InputAudioConfig
263
- # @private
264
- class Representation < Google::Apis::Core::JsonRepresentation
265
- property :audio_encoding, as: 'audioEncoding'
266
- property :sample_rate_hertz, as: 'sampleRateHertz'
267
- end
268
- end
269
-
270
- class ListOperationsResponse
231
+ class ListVoicesResponse
271
232
  # @private
272
233
  class Representation < Google::Apis::Core::JsonRepresentation
273
- property :next_page_token, as: 'nextPageToken'
274
- collection :operations, as: 'operations', class: Google::Apis::TexttospeechV1::Operation, decorator: Google::Apis::TexttospeechV1::Operation::Representation
234
+ collection :voices, as: 'voices', class: Google::Apis::TexttospeechV1::Voice, decorator: Google::Apis::TexttospeechV1::Voice::Representation
275
235
 
276
236
  end
277
237
  end
278
238
 
279
- class ListVoicesResponse
239
+ class MultiSpeakerMarkup
280
240
  # @private
281
241
  class Representation < Google::Apis::Core::JsonRepresentation
282
- collection :voices, as: 'voices', class: Google::Apis::TexttospeechV1::Voice, decorator: Google::Apis::TexttospeechV1::Voice::Representation
242
+ collection :turns, as: 'turns', class: Google::Apis::TexttospeechV1::Turn, decorator: Google::Apis::TexttospeechV1::Turn::Representation
283
243
 
284
244
  end
285
245
  end
@@ -310,6 +270,8 @@ module Google
310
270
  class Representation < Google::Apis::Core::JsonRepresentation
311
271
  property :custom_pronunciations, as: 'customPronunciations', class: Google::Apis::TexttospeechV1::CustomPronunciations, decorator: Google::Apis::TexttospeechV1::CustomPronunciations::Representation
312
272
 
273
+ property :multi_speaker_markup, as: 'multiSpeakerMarkup', class: Google::Apis::TexttospeechV1::MultiSpeakerMarkup, decorator: Google::Apis::TexttospeechV1::MultiSpeakerMarkup::Representation
274
+
313
275
  property :ssml, as: 'ssml'
314
276
  property :text, as: 'text'
315
277
  end
@@ -358,6 +320,14 @@ module Google
358
320
  end
359
321
  end
360
322
 
323
+ class Turn
324
+ # @private
325
+ class Representation < Google::Apis::Core::JsonRepresentation
326
+ property :speaker, as: 'speaker'
327
+ property :text, as: 'text'
328
+ end
329
+ end
330
+
361
331
  class Voice
362
332
  # @private
363
333
  class Representation < Google::Apis::Core::JsonRepresentation
@@ -259,38 +259,6 @@ module Google
259
259
  execute_or_queue_command(command, &block)
260
260
  end
261
261
 
262
- # Generates voice clone key given a short voice prompt. This method validates
263
- # the voice prompts with a series of checks against the voice talent statement
264
- # to verify the voice clone is safe to generate.
265
- # @param [Google::Apis::TexttospeechV1::GenerateVoiceCloningKeyRequest] generate_voice_cloning_key_request_object
266
- # @param [String] fields
267
- # Selector specifying which fields to include in a partial response.
268
- # @param [String] quota_user
269
- # Available to use for quota purposes for server-side applications. Can be any
270
- # arbitrary string assigned to a user, but should not exceed 40 characters.
271
- # @param [Google::Apis::RequestOptions] options
272
- # Request-specific options
273
- #
274
- # @yield [result, err] Result & error if block supplied
275
- # @yieldparam result [Google::Apis::TexttospeechV1::GenerateVoiceCloningKeyResponse] parsed result object
276
- # @yieldparam err [StandardError] error object if request failed
277
- #
278
- # @return [Google::Apis::TexttospeechV1::GenerateVoiceCloningKeyResponse]
279
- #
280
- # @raise [Google::Apis::ServerError] An error occurred on the server and the request can be retried
281
- # @raise [Google::Apis::ClientError] The request is invalid and should not be retried without modification
282
- # @raise [Google::Apis::AuthorizationError] Authorization is required
283
- def generate_voice_cloning_key(generate_voice_cloning_key_request_object = nil, fields: nil, quota_user: nil, options: nil, &block)
284
- command = make_simple_command(:post, 'v1/voices:generateVoiceCloningKey', options)
285
- command.request_representation = Google::Apis::TexttospeechV1::GenerateVoiceCloningKeyRequest::Representation
286
- command.request_object = generate_voice_cloning_key_request_object
287
- command.response_representation = Google::Apis::TexttospeechV1::GenerateVoiceCloningKeyResponse::Representation
288
- command.response_class = Google::Apis::TexttospeechV1::GenerateVoiceCloningKeyResponse
289
- command.query['fields'] = fields unless fields.nil?
290
- command.query['quotaUser'] = quota_user unless quota_user.nil?
291
- execute_or_queue_command(command, &block)
292
- end
293
-
294
262
  # Returns a list of Voice supported for synthesis.
295
263
  # @param [String] language_code
296
264
  # Optional. Recommended. [BCP-47](https://www.rfc-editor.org/rfc/bcp/bcp47.txt)
metadata CHANGED
@@ -1,14 +1,14 @@
1
1
  --- !ruby/object:Gem::Specification
2
2
  name: google-apis-texttospeech_v1
3
3
  version: !ruby/object:Gem::Version
4
- version: 0.32.0
4
+ version: 0.34.0
5
5
  platform: ruby
6
6
  authors:
7
7
  - Google LLC
8
8
  autorequire:
9
9
  bindir: bin
10
10
  cert_chain: []
11
- date: 2024-10-06 00:00:00.000000000 Z
11
+ date: 2024-11-03 00:00:00.000000000 Z
12
12
  dependencies:
13
13
  - !ruby/object:Gem::Dependency
14
14
  name: google-apis-core
@@ -58,7 +58,7 @@ licenses:
58
58
  metadata:
59
59
  bug_tracker_uri: https://github.com/googleapis/google-api-ruby-client/issues
60
60
  changelog_uri: https://github.com/googleapis/google-api-ruby-client/tree/main/generated/google-apis-texttospeech_v1/CHANGELOG.md
61
- documentation_uri: https://googleapis.dev/ruby/google-apis-texttospeech_v1/v0.32.0
61
+ documentation_uri: https://googleapis.dev/ruby/google-apis-texttospeech_v1/v0.34.0
62
62
  source_code_uri: https://github.com/googleapis/google-api-ruby-client/tree/main/generated/google-apis-texttospeech_v1
63
63
  post_install_message:
64
64
  rdoc_options: []
@@ -75,7 +75,7 @@ required_rubygems_version: !ruby/object:Gem::Requirement
75
75
  - !ruby/object:Gem::Version
76
76
  version: '0'
77
77
  requirements: []
78
- rubygems_version: 3.5.6
78
+ rubygems_version: 3.5.21
79
79
  signing_key:
80
80
  specification_version: 4
81
81
  summary: Simple REST client for Cloud Text-to-Speech API V1