google-cloud-speech 0.31.1 → 0.32.0

Sign up to get free protection for your applications and to get access to all the features.
checksums.yaml CHANGED
@@ -1,7 +1,7 @@
1
1
  ---
2
2
  SHA256:
3
- metadata.gz: 6c020aae8d167db11676cfec941720c95d808833a976c7dff4cc5ed70adb76bb
4
- data.tar.gz: ba7bd5abf5fbfe047a62e2208d14df69a295782edbe8a5d96ecdd161ebe07bde
3
+ metadata.gz: 58d05dda613bbd299a497420c6041d87f24341b805c31b1adde99408e0039aeb
4
+ data.tar.gz: ab6f46d2a5013541196b60c3334aae34371a9a7cdeb2aa3e296a6dfb10fc64bb
5
5
  SHA512:
6
- metadata.gz: cc0c3b397c928b5c9f5b12c113aa03e9547aee071e5f5ff7e6591d2dd1b24566210b6c1581c0652a039851faab139175282a9a8735d213f0a3831db41701013e
7
- data.tar.gz: 394fe29602211aa0a6a847631ebe7d26cd0996f9ba9d4a1c31a5144394b1726bc9ecb289e0e6eaf6e4a23eed5235b4cbdc08b1e701ac7f7fa0a4027ffa748791
6
+ metadata.gz: 7e90bf229e973607f17495decf94580dcf3bfd8775eba9dab950434a432a2533db93f847f6a48d1dff430d05d41f63a12461727a58f7acb7acb0963be2adbf4d
7
+ data.tar.gz: 696db8cf73a3ddf704e46e07bbf1108346a371784869d415f314887dd2938c3a9e8f06c9471e24a94d3f289d676deab4b0fe67033d1f00cc5547c9e3f2f4978d
@@ -21,17 +21,17 @@
21
21
  },
22
22
  "methods": {
23
23
  "Recognize": {
24
- "timeout_millis": 1000000,
24
+ "timeout_millis": 200000,
25
25
  "retry_codes_name": "idempotent",
26
26
  "retry_params_name": "default"
27
27
  },
28
28
  "LongRunningRecognize": {
29
- "timeout_millis": 60000,
29
+ "timeout_millis": 200000,
30
30
  "retry_codes_name": "non_idempotent",
31
31
  "retry_params_name": "default"
32
32
  },
33
33
  "StreamingRecognize": {
34
- "timeout_millis": 1000000,
34
+ "timeout_millis": 200000,
35
35
  "retry_codes_name": "idempotent",
36
36
  "retry_params_name": "default"
37
37
  }
@@ -8,6 +8,7 @@ require 'google/api/annotations_pb'
8
8
  require 'google/longrunning/operations_pb'
9
9
  require 'google/protobuf/any_pb'
10
10
  require 'google/protobuf/duration_pb'
11
+ require 'google/protobuf/empty_pb'
11
12
  require 'google/protobuf/timestamp_pb'
12
13
  require 'google/rpc/status_pb'
13
14
  Google::Protobuf::DescriptorPool.generated_pool.build do
@@ -134,6 +135,7 @@ Google::Protobuf::DescriptorPool.generated_pool.build do
134
135
  repeated :alternatives, :message, 1, "google.cloud.speech.v1p1beta1.SpeechRecognitionAlternative"
135
136
  optional :is_final, :bool, 2
136
137
  optional :stability, :float, 3
138
+ optional :result_end_time, :message, 4, "google.protobuf.Duration"
137
139
  optional :channel_tag, :int32, 5
138
140
  optional :language_code, :string, 6
139
141
  end
@@ -1,7 +1,7 @@
1
1
  # Generated by the protocol buffer compiler. DO NOT EDIT!
2
2
  # Source: google/cloud/speech/v1p1beta1/cloud_speech.proto for package 'google.cloud.speech.v1p1beta1'
3
3
  # Original file comments:
4
- # Copyright 2018 Google Inc.
4
+ # Copyright 2018 Google LLC.
5
5
  #
6
6
  # Licensed under the Apache License, Version 2.0 (the "License");
7
7
  # you may not use this file except in compliance with the License.
@@ -15,6 +15,7 @@
15
15
  # See the License for the specific language governing permissions and
16
16
  # limitations under the License.
17
17
  #
18
+ #
18
19
 
19
20
 
20
21
  require 'grpc'
@@ -57,7 +57,7 @@ module Google
57
57
  # `audio_content` data. The audio bytes must be encoded as specified in
58
58
  # `RecognitionConfig`. Note: as with all bytes fields, protobuffers use a
59
59
  # pure binary representation (not base64). See
60
- # [audio limits](https://cloud.google.com/speech/limits#content).
60
+ # [content limits](https://cloud.google.com/speech-to-text/quotas#content).
61
61
  class StreamingRecognizeRequest; end
62
62
 
63
63
  # Provides information to the recognizer that specifies how to process the
@@ -111,36 +111,36 @@ module Google
111
111
  # Valid values for OGG_OPUS are '1'-'254'.
112
112
  # Valid value for MULAW, AMR, AMR_WB and SPEEX_WITH_HEADER_BYTE is only `1`.
113
113
  # If `0` or omitted, defaults to one channel (mono).
114
- # NOTE: We only recognize the first channel by default.
114
+ # Note: We only recognize the first channel by default.
115
115
  # To perform independent recognition on each channel set
116
- # enable_separate_recognition_per_channel to 'true'.
116
+ # `enable_separate_recognition_per_channel` to 'true'.
117
117
  # @!attribute [rw] enable_separate_recognition_per_channel
118
118
  # @return [true, false]
119
- # This needs to be set to ‘true’ explicitly and audio_channel_count > 1
119
+ # This needs to be set to 'true' explicitly and `audio_channel_count` > 1
120
120
  # to get each channel recognized separately. The recognition result will
121
- # contain a channel_tag field to state which channel that result belongs to.
122
- # If this is not true’, we will only recognize the first channel.
123
- # NOTE: The request is also billed cumulatively for all channels recognized:
124
- # (audio_channel_count times the audio length)
121
+ # contain a `channel_tag` field to state which channel that result belongs
122
+ # to. If this is not true, we will only recognize the first channel. The
123
+ # request is billed cumulatively for all channels recognized:
124
+ # `audio_channel_count` multiplied by the length of the audio.
125
125
  # @!attribute [rw] language_code
126
126
  # @return [String]
127
127
  # *Required* The language of the supplied audio as a
128
128
  # [BCP-47](https://www.rfc-editor.org/rfc/bcp/bcp47.txt) language tag.
129
129
  # Example: "en-US".
130
- # See [Language Support](https://cloud.google.com/speech/docs/languages)
130
+ # See [Language Support](https://cloud.google.com/speech-to-text/docs/languages)
131
131
  # for a list of the currently supported language codes.
132
132
  # @!attribute [rw] alternative_language_codes
133
133
  # @return [Array<String>]
134
134
  # *Optional* A list of up to 3 additional
135
135
  # [BCP-47](https://www.rfc-editor.org/rfc/bcp/bcp47.txt) language tags,
136
136
  # listing possible alternative languages of the supplied audio.
137
- # See [Language Support](https://cloud.google.com/speech/docs/languages)
137
+ # See [Language Support](https://cloud.google.com/speech-to-text/docs/languages)
138
138
  # for a list of the currently supported language codes.
139
139
  # If alternative languages are listed, recognition result will contain
140
140
  # recognition in the most likely language detected including the main
141
141
  # language_code. The recognition result will include the language tag
142
142
  # of the language detected in the audio.
143
- # NOTE: This feature is only supported for Voice Command and Voice Search
143
+ # Note: This feature is only supported for Voice Command and Voice Search
144
144
  # use cases and performance may vary for other use cases (e.g., phone call
145
145
  # transcription).
146
146
  # @!attribute [rw] max_alternatives
@@ -159,7 +159,9 @@ module Google
159
159
  # won't be filtered out.
160
160
  # @!attribute [rw] speech_contexts
161
161
  # @return [Array<Google::Cloud::Speech::V1p1beta1::SpeechContext>]
162
- # *Optional* A means to provide context to assist the speech recognition.
162
+ # *Optional* array of {Google::Cloud::Speech::V1p1beta1::SpeechContext SpeechContext}.
163
+ # A means to provide context to assist the speech recognition. For more
164
+ # information, see [Phrase Hints](https://cloud.google.com/speech-to-text/docs/basics#phrase-hints).
163
165
  # @!attribute [rw] enable_word_time_offsets
164
166
  # @return [true, false]
165
167
  # *Optional* If `true`, the top result includes a list of words and
@@ -177,18 +179,20 @@ module Google
177
179
  # This feature is only available in select languages. Setting this for
178
180
  # requests in other languages has no effect at all.
179
181
  # The default 'false' value does not add punctuation to result hypotheses.
180
- # NOTE: "This is currently offered as an experimental service, complimentary
182
+ # Note: This is currently offered as an experimental service, complimentary
181
183
  # to all users. In the future this may be exclusively available as a
182
- # premium feature."
184
+ # premium feature.
183
185
  # @!attribute [rw] enable_speaker_diarization
184
186
  # @return [true, false]
185
187
  # *Optional* If 'true', enables speaker detection for each recognized word in
186
188
  # the top alternative of the recognition result using a speaker_tag provided
187
189
  # in the WordInfo.
188
190
  # Note: When this is true, we send all the words from the beginning of the
189
- # audio for the top alternative in every consecutive responses.
191
+ # audio for the top alternative in every consecutive STREAMING response.
190
192
  # This is done in order to improve our speaker tags as our models learn to
191
193
  # identify the speakers in the conversation over time.
194
+ # For non-streaming requests, the diarization results will be provided only
195
+ # in the top alternative of the FINAL SpeechRecognitionResult.
192
196
  # @!attribute [rw] diarization_speaker_count
193
197
  # @return [Integer]
194
198
  # *Optional*
@@ -235,14 +239,18 @@ module Google
235
239
  # @!attribute [rw] use_enhanced
236
240
  # @return [true, false]
237
241
  # *Optional* Set to true to use an enhanced model for speech recognition.
238
- # You must also set the `model` field to a valid, enhanced model. If
239
- # `use_enhanced` is set to true and the `model` field is not set, then
240
- # `use_enhanced` is ignored. If `use_enhanced` is true and an enhanced
241
- # version of the specified model does not exist, then the speech is
242
- # recognized using the standard version of the specified model.
242
+ # If `use_enhanced` is set to true and the `model` field is not set, then
243
+ # an appropriate enhanced model is chosen if:
244
+ # 1. project is eligible for requesting enhanced models
245
+ # 2. an enhanced model exists for the audio
243
246
  #
244
- # Enhanced speech models require that you opt-in to the audio logging using
245
- # instructions in the [alpha documentation](https://cloud.google.com/speech/data-sharing). If you set
247
+ # If `use_enhanced` is true and an enhanced version of the specified model
248
+ # does not exist, then the speech is recognized using the standard version
249
+ # of the specified model.
250
+ #
251
+ # Enhanced speech models require that you opt in to data logging using
252
+ # instructions in the
253
+ # [documentation](https://cloud.google.com/speech-to-text/docs/enable-data-logging). If you set
246
254
  # `use_enhanced` to true and you have not enabled audio logging, then you
247
255
  # will receive an error.
248
256
  class RecognitionConfig
@@ -452,13 +460,13 @@ module Google
452
460
  # to improve the accuracy for specific words and phrases, for example, if
453
461
  # specific commands are typically spoken by the user. This can also be used
454
462
  # to add additional words to the vocabulary of the recognizer. See
455
- # [usage limits](https://cloud.google.com/speech/limits#content).
463
+ # [usage limits](https://cloud.google.com/speech-to-text/quotas#content).
456
464
  class SpeechContext; end
457
465
 
458
466
  # Contains audio data in the encoding specified in the `RecognitionConfig`.
459
467
  # Either `content` or `uri` must be supplied. Supplying both or neither
460
468
  # returns {Google::Rpc::Code::INVALID_ARGUMENT}. See
461
- # [audio limits](https://cloud.google.com/speech/limits#content).
469
+ # [content limits](https://cloud.google.com/speech-to-text/quotas#content).
462
470
  # @!attribute [rw] content
463
471
  # @return [String]
464
472
  # The audio data bytes encoded as specified in
@@ -467,7 +475,8 @@ module Google
467
475
  # @!attribute [rw] uri
468
476
  # @return [String]
469
477
  # URI that points to a file that contains audio data bytes as specified in
470
- # `RecognitionConfig`. Currently, only Google Cloud Storage URIs are
478
+ # `RecognitionConfig`. The file must not be compressed (for example, gzip).
479
+ # Currently, only Google Cloud Storage URIs are
471
480
  # supported, which must be specified in the following format:
472
481
  # `gs://bucket_name/object_name` (other URI formats return
473
482
  # {Google::Rpc::Code::INVALID_ARGUMENT}). For more information, see
@@ -610,6 +619,10 @@ module Google
610
619
  # (completely unstable) to 1.0 (completely stable).
611
620
  # This field is only provided for interim results (`is_final=false`).
612
621
  # The default of 0.0 is a sentinel value indicating `stability` was not set.
622
+ # @!attribute [rw] result_end_time
623
+ # @return [Google::Protobuf::Duration]
624
+ # Output only. Time offset of the end of this result relative to the
625
+ # beginning of the audio.
613
626
  # @!attribute [rw] channel_tag
614
627
  # @return [Integer]
615
628
  # For multi-channel audio, this is the channel number corresponding to the
@@ -659,7 +672,7 @@ module Google
659
672
  # @!attribute [rw] words
660
673
  # @return [Array<Google::Cloud::Speech::V1p1beta1::WordInfo>]
661
674
  # Output only. A list of word-specific information for each recognized word.
662
- # Note: When enable_speaker_diarization is true, you will see all the words
675
+ # Note: When `enable_speaker_diarization` is true, you will see all the words
663
676
  # from the beginning of the audio.
664
677
  class SpeechRecognitionAlternative; end
665
678
 
@@ -21,17 +21,17 @@
21
21
  },
22
22
  "methods": {
23
23
  "Recognize": {
24
- "timeout_millis": 1000000,
24
+ "timeout_millis": 200000,
25
25
  "retry_codes_name": "idempotent",
26
26
  "retry_params_name": "default"
27
27
  },
28
28
  "LongRunningRecognize": {
29
- "timeout_millis": 60000,
29
+ "timeout_millis": 200000,
30
30
  "retry_codes_name": "non_idempotent",
31
31
  "retry_params_name": "default"
32
32
  },
33
33
  "StreamingRecognize": {
34
- "timeout_millis": 1000000,
34
+ "timeout_millis": 905000,
35
35
  "retry_codes_name": "idempotent",
36
36
  "retry_params_name": "default"
37
37
  }
metadata CHANGED
@@ -1,14 +1,14 @@
1
1
  --- !ruby/object:Gem::Specification
2
2
  name: google-cloud-speech
3
3
  version: !ruby/object:Gem::Version
4
- version: 0.31.1
4
+ version: 0.32.0
5
5
  platform: ruby
6
6
  authors:
7
7
  - Google LLC
8
8
  autorequire:
9
9
  bindir: bin
10
10
  cert_chain: []
11
- date: 2018-09-21 00:00:00.000000000 Z
11
+ date: 2018-11-15 00:00:00.000000000 Z
12
12
  dependencies:
13
13
  - !ruby/object:Gem::Dependency
14
14
  name: google-gax
@@ -58,14 +58,14 @@ dependencies:
58
58
  requirements:
59
59
  - - "~>"
60
60
  - !ruby/object:Gem::Version
61
- version: 0.50.0
61
+ version: 0.59.2
62
62
  type: :development
63
63
  prerelease: false
64
64
  version_requirements: !ruby/object:Gem::Requirement
65
65
  requirements:
66
66
  - - "~>"
67
67
  - !ruby/object:Gem::Version
68
- version: 0.50.0
68
+ version: 0.59.2
69
69
  - !ruby/object:Gem::Dependency
70
70
  name: simplecov
71
71
  requirement: !ruby/object:Gem::Requirement