RubyGems - google-cloud-speech - Versions diffs - 0.21.0 → 0.21.1 - Mend

google-cloud-speech 0.21.0 → 0.21.1

Files changed (12) hide show

checksums.yaml +4 -4
data/.yardopts +9 -0
data/LICENSE +201 -0
data/README.md +62 -0
data/lib/google/cloud/speech.rb +2 -2
data/lib/google/cloud/speech/project.rb +4 -3
data/lib/google/cloud/speech/result.rb +3 -3
data/lib/google/cloud/speech/stream.rb +42 -39
data/lib/google/cloud/speech/v1beta1/doc/google/cloud/speech/v1beta1/cloud_speech.rb +377 -0
data/lib/google/cloud/speech/v1beta1/speech_api.rb +4 -4
data/lib/google/cloud/speech/version.rb +1 -1
metadata +9 -5

checksums.yaml CHANGED

@@ -1,7 +1,7 @@
 ---
 SHA1:
-  metadata.gz: 83a0ff44f2fad9796bdd39f3493c05e858bb7165
-  data.tar.gz: f5f63a9a256c082864f7fcbcdfa7741e8f55b494
+  metadata.gz: a35a3d6fd09318b755221c8c3f95ef781ebe897f
+  data.tar.gz: 15079061caf8289b64f42f39f5d110d3500d1250
 SHA512:
-  metadata.gz: a077cbf101500f553b7156a23b44e83086e6ef2c452edaffaac4cdedda39ef86712da8e58821f933f6b8076b08e2de5132696e57856a0f528d756816bddee2ee
-  data.tar.gz: cac8e868df8240737eaa8733190743afaf314353f6ad806f885f6d8fd55d5d4e19dda6de4df0325666a621a44216b551883224058ec7c45a2be2b0d0a36f2df6
+  metadata.gz: f55af213c9e770573b0c32f1993dfef05e1566de1b6a0e2643240a2a872319430f218e5f45243750d6bda7d00a46aad1d91bc88473290c6984ba07ca9381c3f1
+  data.tar.gz: ae663be1584beadca2eaeb04090fe313de27ce523099bb770c10fec85f6c8f6861a43bbc6310e19e74958b79a273f10da2033c7b0f8ace09d934f1adec304131

data/.yardopts ADDED

@@ -0,0 +1,9 @@
+--no-private
+--title=Google Cloud Speech
+--exclude lib/google/cloud/speech/v1beta1
+--exclude lib/google/cloud/speech/v1beta1.rb
+--markup markdown
+./lib/**/*.rb
+-
+README.md

data/LICENSE ADDED

@@ -0,0 +1,201 @@
+                                 Apache License
+                           Version 2.0, January 2004
+                        http://www.apache.org/licenses/
+   TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION
+   1. Definitions.
+      "License" shall mean the terms and conditions for use, reproduction,
+      and distribution as defined by Sections 1 through 9 of this document.
+      "Licensor" shall mean the copyright owner or entity authorized by
+      the copyright owner that is granting the License.
+      "Legal Entity" shall mean the union of the acting entity and all
+      other entities that control, are controlled by, or are under common
+      control with that entity. For the purposes of this definition,
+      "control" means (i) the power, direct or indirect, to cause the
+      direction or management of such entity, whether by contract or
+      otherwise, or (ii) ownership of fifty percent (50%) or more of the
+      outstanding shares, or (iii) beneficial ownership of such entity.
+      "You" (or "Your") shall mean an individual or Legal Entity
+      exercising permissions granted by this License.
+      "Source" form shall mean the preferred form for making modifications,
+      including but not limited to software source code, documentation
+      source, and configuration files.
+      "Object" form shall mean any form resulting from mechanical
+      transformation or translation of a Source form, including but
+      not limited to compiled object code, generated documentation,
+      and conversions to other media types.
+      "Work" shall mean the work of authorship, whether in Source or
+      Object form, made available under the License, as indicated by a
+      copyright notice that is included in or attached to the work
+      (an example is provided in the Appendix below).
+      "Derivative Works" shall mean any work, whether in Source or Object
+      form, that is based on (or derived from) the Work and for which the
+      editorial revisions, annotations, elaborations, or other modifications
+      represent, as a whole, an original work of authorship. For the purposes
+      of this License, Derivative Works shall not include works that remain
+      separable from, or merely link (or bind by name) to the interfaces of,
+      the Work and Derivative Works thereof.
+      "Contribution" shall mean any work of authorship, including
+      the original version of the Work and any modifications or additions
+      to that Work or Derivative Works thereof, that is intentionally
+      submitted to Licensor for inclusion in the Work by the copyright owner
+      or by an individual or Legal Entity authorized to submit on behalf of
+      the copyright owner. For the purposes of this definition, "submitted"
+      means any form of electronic, verbal, or written communication sent
+      to the Licensor or its representatives, including but not limited to
+      communication on electronic mailing lists, source code control systems,
+      and issue tracking systems that are managed by, or on behalf of, the
+      Licensor for the purpose of discussing and improving the Work, but
+      excluding communication that is conspicuously marked or otherwise
+      designated in writing by the copyright owner as "Not a Contribution."
+      "Contributor" shall mean Licensor and any individual or Legal Entity
+      on behalf of whom a Contribution has been received by Licensor and
+      subsequently incorporated within the Work.
+   2. Grant of Copyright License. Subject to the terms and conditions of
+      this License, each Contributor hereby grants to You a perpetual,
+      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
+      copyright license to reproduce, prepare Derivative Works of,
+      publicly display, publicly perform, sublicense, and distribute the
+      Work and such Derivative Works in Source or Object form.
+   3. Grant of Patent License. Subject to the terms and conditions of
+      this License, each Contributor hereby grants to You a perpetual,
+      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
+      (except as stated in this section) patent license to make, have made,
+      use, offer to sell, sell, import, and otherwise transfer the Work,
+      where such license applies only to those patent claims licensable
+      by such Contributor that are necessarily infringed by their
+      Contribution(s) alone or by combination of their Contribution(s)
+      with the Work to which such Contribution(s) was submitted. If You
+      institute patent litigation against any entity (including a
+      cross-claim or counterclaim in a lawsuit) alleging that the Work
+      or a Contribution incorporated within the Work constitutes direct
+      or contributory patent infringement, then any patent licenses
+      granted to You under this License for that Work shall terminate
+      as of the date such litigation is filed.
+   4. Redistribution. You may reproduce and distribute copies of the
+      Work or Derivative Works thereof in any medium, with or without
+      modifications, and in Source or Object form, provided that You
+      meet the following conditions:
+      (a) You must give any other recipients of the Work or
+          Derivative Works a copy of this License; and
+      (b) You must cause any modified files to carry prominent notices
+          stating that You changed the files; and
+      (c) You must retain, in the Source form of any Derivative Works
+          that You distribute, all copyright, patent, trademark, and
+          attribution notices from the Source form of the Work,
+          excluding those notices that do not pertain to any part of
+          the Derivative Works; and
+      (d) If the Work includes a "NOTICE" text file as part of its
+          distribution, then any Derivative Works that You distribute must
+          include a readable copy of the attribution notices contained
+          within such NOTICE file, excluding those notices that do not
+          pertain to any part of the Derivative Works, in at least one
+          of the following places: within a NOTICE text file distributed
+          as part of the Derivative Works; within the Source form or
+          documentation, if provided along with the Derivative Works; or,
+          within a display generated by the Derivative Works, if and
+          wherever such third-party notices normally appear. The contents
+          of the NOTICE file are for informational purposes only and
+          do not modify the License. You may add Your own attribution
+          notices within Derivative Works that You distribute, alongside
+          or as an addendum to the NOTICE text from the Work, provided
+          that such additional attribution notices cannot be construed
+          as modifying the License.
+      You may add Your own copyright statement to Your modifications and
+      may provide additional or different license terms and conditions
+      for use, reproduction, or distribution of Your modifications, or
+      for any such Derivative Works as a whole, provided Your use,
+      reproduction, and distribution of the Work otherwise complies with
+      the conditions stated in this License.
+   5. Submission of Contributions. Unless You explicitly state otherwise,
+      any Contribution intentionally submitted for inclusion in the Work
+      by You to the Licensor shall be under the terms and conditions of
+      this License, without any additional terms or conditions.
+      Notwithstanding the above, nothing herein shall supersede or modify
+      the terms of any separate license agreement you may have executed
+      with Licensor regarding such Contributions.
+   6. Trademarks. This License does not grant permission to use the trade
+      names, trademarks, service marks, or product names of the Licensor,
+      except as required for reasonable and customary use in describing the
+      origin of the Work and reproducing the content of the NOTICE file.
+   7. Disclaimer of Warranty. Unless required by applicable law or
+      agreed to in writing, Licensor provides the Work (and each
+      Contributor provides its Contributions) on an "AS IS" BASIS,
+      WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
+      implied, including, without limitation, any warranties or conditions
+      of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
+      PARTICULAR PURPOSE. You are solely responsible for determining the
+      appropriateness of using or redistributing the Work and assume any
+      risks associated with Your exercise of permissions under this License.
+   8. Limitation of Liability. In no event and under no legal theory,
+      whether in tort (including negligence), contract, or otherwise,
+      unless required by applicable law (such as deliberate and grossly
+      negligent acts) or agreed to in writing, shall any Contributor be
+      liable to You for damages, including any direct, indirect, special,
+      incidental, or consequential damages of any character arising as a
+      result of this License or out of the use or inability to use the
+      Work (including but not limited to damages for loss of goodwill,
+      work stoppage, computer failure or malfunction, or any and all
+      other commercial damages or losses), even if such Contributor
+      has been advised of the possibility of such damages.
+   9. Accepting Warranty or Additional Liability. While redistributing
+      the Work or Derivative Works thereof, You may choose to offer,
+      and charge a fee for, acceptance of support, warranty, indemnity,
+      or other liability obligations and/or rights consistent with this
+      License. However, in accepting such obligations, You may act only
+      on Your own behalf and on Your sole responsibility, not on behalf
+      of any other Contributor, and only if You agree to indemnify,
+      defend, and hold each Contributor harmless for any liability
+      incurred by, or claims asserted against, such Contributor by reason
+      of your accepting any such warranty or additional liability.
+   END OF TERMS AND CONDITIONS
+   APPENDIX: How to apply the Apache License to your work.
+      To apply the Apache License to your work, attach the following
+      boilerplate notice, with the fields enclosed by brackets "[]"
+      replaced with your own identifying information. (Don't include
+      the brackets!)  The text should be enclosed in the appropriate
+      comment syntax for the file format. We also recommend that a
+      file or class name and description of purpose be included on the
+      same "printed page" as the copyright notice for easier
+      identification within third-party archives.
+   Copyright [yyyy] [name of copyright owner]
+   Licensed under the Apache License, Version 2.0 (the "License");
+   you may not use this file except in compliance with the License.
+   You may obtain a copy of the License at
+       http://www.apache.org/licenses/LICENSE-2.0
+   Unless required by applicable law or agreed to in writing, software
+   distributed under the License is distributed on an "AS IS" BASIS,
+   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+   See the License for the specific language governing permissions and
+   limitations under the License.

data/README.md ADDED

@@ -0,0 +1,62 @@
+# google-cloud-speech
+[Google Cloud Speech API](https://cloud.google.com/speech/) ([docs](https://cloud.google.com/speech/docs)) enables developers to convert audio to text by applying powerful neural network models.
+- [google-cloud-speech API documentation](http://googlecloudplatform.github.io/google-cloud-ruby/#/docs/google-cloud-speech/master/google/cloud/speech)
+- [google-cloud-speech on RubyGems](https://rubygems.org/gems/google-cloud-speech)
+- [Google Cloud Speech API documentation](https://cloud.google.com/speech/docs)
+## Quick Start
+```sh
+$ gem install google-cloud-speech
+```
+## Authentication
+This library uses Service Account credentials to connect to Google Cloud services. When running on Compute Engine the credentials will be discovered automatically. When running on other environments the Service Account credentials can be specified by providing the path to the JSON file, or the JSON itself, in environment variables.
+Instructions and configuration options are covered in the [Authentication Guide](https://googlecloudplatform.github.io/google-cloud-ruby/#/docs/google-cloud-speech/guides/authentication).
+## Example
+```ruby
+require "google/cloud/speech"
+speech = Google::Cloud::Speech.new
+audio = speech.audio "path/to/audio.raw",
+                     encoding: :raw, sample_rate: 16000
+results = audio.recognize
+result = results.first
+result.transcript #=> "how old is the Brooklyn Bridge"
+result.confidence #=> 0.9826789498329163
+```
+## Supported Ruby Versions
+This library is supported on Ruby 2.0+.
+## Versioning
+This library follows [Semantic Versioning](http://semver.org/).
+It is currently in major version zero (0.y.z), which means that anything may change at any time and the public API should not be considered stable.
+## Contributing
+Contributions to this library are always welcome and highly encouraged.
+See the [Contributing Guide](https://googlecloudplatform.github.io/google-cloud-ruby/#/docs/guides/contributing) for more information on how to get started.
+Please note that this project is released with a Contributor Code of Conduct. By participating in this project you agree to abide by its terms. See [Code of Conduct](../CODE_OF_CONDUCT.md) for more information.
+## License
+This library is licensed under Apache 2.0. Full license text is available in [LICENSE](LICENSE).
+## Support
+Please [report bugs at the project on GitHub](https://github.com/GoogleCloudPlatform/google-cloud-ruby/issues).
+Don't hesitate to [ask questions](http://stackoverflow.com/questions/tagged/google-cloud-ruby) about the client or APIs on [StackOverflow](http://stackoverflow.com).

data/lib/google/cloud/speech.rb CHANGED

@@ -158,9 +158,9 @@ module Google
     #   result.confidence #=> 0.9826789498329163
     # end
     #
-    # # Stream 5 seconds of audio from the microhone
+    # # Stream 5 seconds of audio from the microphone
     # # Actual implementation of microphone input varies by platform
-    # 5.times.do
+    # 5.times do
     #   stream.send MicrophoneInput.read(32000)
     # end
     #

data/lib/google/cloud/speech/project.rb CHANGED

@@ -462,7 +462,7 @@ module Google
         #
         #   speech = Google::Cloud::Speech.new
         #
-        #   stream = audio.stream encoding: :raw, sample_rate: 16000
+        #   stream = speech.stream encoding: :raw, sample_rate: 16000
         #
         #   # register callback for when a result is returned
         #   stream.on_result do |results|
@@ -471,9 +471,9 @@ module Google
         #     puts result.confidence # 0.9826789498329163
         #   end
         #
-        #   # Stream 5 seconds of audio from the microhone
+        #   # Stream 5 seconds of audio from the microphone
         #   # Actual implementation of microphone input varies by platform
-        #   5.times.do
+        #   5.times do
         #     stream.send MicrophoneInput.read(32000)
         #   end
         #
@@ -509,6 +509,7 @@ module Google
                          phrases: nil
           context = nil
           context = V1beta1::SpeechContext.new(phrases: phrases) if phrases
+          language = String(language) unless language.nil?
           V1beta1::RecognitionConfig.new({
             encoding: convert_encoding(encoding),
             sample_rate: sample_rate,

data/lib/google/cloud/speech/result.rb CHANGED

@@ -150,7 +150,7 @@ module Google
       #
       #   speech = Google::Cloud::Speech.new
       #
-      #   stream = audio.stream encoding: :raw, sample_rate: 16000
+      #   stream = speech.stream encoding: :raw, sample_rate: 16000
       #
       #   # register callback for when an interim result is returned
       #   stream.on_interim do |final_results, interim_results|
@@ -160,9 +160,9 @@ module Google
       #     puts interim_result.stability # 0.8999
       #   end
       #
-      #   # Stream 5 seconds of audio from the microhone
+      #   # Stream 5 seconds of audio from the microphone
       #   # Actual implementation of microphone input varies by platform
-      #   5.times.do
+      #   5.times do
       #     stream.send MicrophoneInput.read(32000)
       #   end
       #

data/lib/google/cloud/speech/stream.rb CHANGED

@@ -31,7 +31,7 @@ module Google
       #
       #   speech = Google::Cloud::Speech.new
       #
-      #   stream = audio.stream encoding: :raw, sample_rate: 16000
+      #   stream = speech.stream encoding: :raw, sample_rate: 16000
       #
       #   # register callback for when a result is returned
       #   stream.on_result do |results|
@@ -40,9 +40,9 @@ module Google
       #     puts result.confidence # 0.9826789498329163
       #   end
       #
-      #   # Stream 5 seconds of audio from the microhone
+      #   # Stream 5 seconds of audio from the microphone
       #   # Actual implementation of microphone input varies by platform
-      #   5.times.do
+      #   5.times do
       #     stream.send MicrophoneInput.read(32000)
       #   end
       #
@@ -93,6 +93,8 @@ module Google
         #
         #   speech = Google::Cloud::Speech.new
         #
+        #   audio = speech.audio "path/to/audio.raw"
+        #
         #   stream = speech.stream encoding: :raw, sample_rate: 16000
         #
         #   # register callback for when a result is returned
@@ -102,9 +104,9 @@ module Google
         #     puts result.confidence # 0.9826789498329163
         #   end
         #
-        #   # Stream 5 seconds of audio from the microhone
+        #   # Stream 5 seconds of audio from the microphone
         #   # Actual implementation of microphone input varies by platform
-        #   5.times.do
+        #   5.times do
         #     stream.send MicrophoneInput.read(32000)
         #   end
         #
@@ -151,20 +153,21 @@ module Google
         #
         #   speech = Google::Cloud::Speech.new
         #
-        #   stream = audio.stream encoding: :raw, sample_rate: 16000
+        #   stream = speech.stream encoding: :raw, sample_rate: 16000
         #
-        #   # Stream 5 seconds of audio from the microhone
+        #   # Stream 5 seconds of audio from the microphone
         #   # Actual implementation of microphone input varies by platform
-        #   5.times.do
+        #   5.times do
         #     stream.send MicrophoneInput.read(32000)
         #   end
         #
         #   stream.stop
         #
         #   results = stream.results
-        #   result = results.first
-        #   puts result.transcript # "how old is the Brooklyn Bridge"
-        #   puts result.confidence # 0.9826789498329163
+        #   results.each do |result|
+        #     puts result.transcript
+        #     puts result.confidence
+        #   end
         #
         def results
           synchronize do
@@ -184,7 +187,7 @@ module Google
         #
         #   speech = Google::Cloud::Speech.new
         #
-        #   stream = audio.stream encoding: :raw, sample_rate: 16000
+        #   stream = speech.stream encoding: :raw, sample_rate: 16000
         #
         #   # register callback for when an interim result is returned
         #   stream.on_interim do |final_results, interim_results|
@@ -194,9 +197,9 @@ module Google
         #     puts interim_result.stability # 0.8999
         #   end
         #
-        #   # Stream 5 seconds of audio from the microhone
+        #   # Stream 5 seconds of audio from the microphone
         #   # Actual implementation of microphone input varies by platform
-        #   5.times.do
+        #   5.times do
         #     stream.send MicrophoneInput.read(32000)
         #   end
         #
@@ -227,7 +230,7 @@ module Google
         #
         #   speech = Google::Cloud::Speech.new
         #
-        #   stream = audio.stream encoding: :raw, sample_rate: 16000
+        #   stream = speech.stream encoding: :raw, sample_rate: 16000
         #
         #   # register callback for when a result is returned
         #   stream.on_result do |results|
@@ -236,9 +239,9 @@ module Google
         #     puts result.confidence # 0.9826789498329163
         #   end
         #
-        #   # Stream 5 seconds of audio from the microhone
+        #   # Stream 5 seconds of audio from the microphone
         #   # Actual implementation of microphone input varies by platform
-        #   5.times.do
+        #   5.times do
         #     stream.send MicrophoneInput.read(32000)
         #   end
         #
@@ -259,7 +262,7 @@ module Google
           result!
         end
-        # @private yields each final results as they are recieved
+        # @private yields the final results as they are received
         def result!
           synchronize do
             @callbacks[:result].each { |c| c.call results }
@@ -278,16 +281,16 @@ module Google
         #
         #   speech = Google::Cloud::Speech.new
         #
-        #   stream = audio.stream encoding: :raw, sample_rate: 16000
+        #   stream = speech.stream encoding: :raw, sample_rate: 16000
         #
         #   # register callback for when speech has started.
         #   stream.on_speech_start do
         #     puts "Speech has started."
         #   end
         #
-        #   # Stream 5 seconds of audio from the microhone
+        #   # Stream 5 seconds of audio from the microphone
         #   # Actual implementation of microphone input varies by platform
-        #   5.times.do
+        #   5.times do
         #     stream.send MicrophoneInput.read(32000)
         #   end
         #
@@ -300,7 +303,7 @@ module Google
         end
         # @private returns single final result once :END_OF_UTTERANCE is
-        # recieved.
+        # received.
         def speech_start!
           synchronize do
             @callbacks[:speech_start].each(&:call)
@@ -319,16 +322,16 @@ module Google
         #
         #   speech = Google::Cloud::Speech.new
         #
-        #   stream = audio.stream encoding: :raw, sample_rate: 16000
+        #   stream = speech.stream encoding: :raw, sample_rate: 16000
         #
         #   # register callback for when speech has ended.
         #   stream.on_speech_end do
         #     puts "Speech has ended."
         #   end
         #
-        #   # Stream 5 seconds of audio from the microhone
+        #   # Stream 5 seconds of audio from the microphone
         #   # Actual implementation of microphone input varies by platform
-        #   5.times.do
+        #   5.times do
         #     stream.send MicrophoneInput.read(32000)
         #   end
         #
@@ -341,7 +344,7 @@ module Google
         end
         # @private yields single final result once :END_OF_UTTERANCE is
-        # recieved.
+        # received.
         def speech_end!
           synchronize do
             @callbacks[:speech_end].each(&:call)
@@ -360,16 +363,16 @@ module Google
         #
         #   speech = Google::Cloud::Speech.new
         #
-        #   stream = audio.stream encoding: :raw, sample_rate: 16000
+        #   stream = speech.stream encoding: :raw, sample_rate: 16000
         #
         #   # register callback for when audio has ended.
         #   stream.on_complete do
         #     puts "Audio has ended."
         #   end
         #
-        #   # Stream 5 seconds of audio from the microhone
+        #   # Stream 5 seconds of audio from the microphone
         #   # Actual implementation of microphone input varies by platform
-        #   5.times.do
+        #   5.times do
         #     stream.send MicrophoneInput.read(32000)
         #   end
         #
@@ -405,9 +408,9 @@ module Google
         #
         #   speech = Google::Cloud::Speech.new
         #
-        #   stream = audio.stream encoding: :raw,
-        #                         sample_rate: 16000,
-        #                         utterance: true
+        #   stream = speech.stream encoding: :raw,
+        #                          sample_rate: 16000,
+        #                          utterance: true
         #
         #   # register callback for when utterance has occurred.
         #   stream.on_utterance do
@@ -415,9 +418,9 @@ module Google
         #     stream.stop
         #   end
         #
-        #   # Stream 5 seconds of audio from the microhone
+        #   # Stream 5 seconds of audio from the microphone
         #   # Actual implementation of microphone input varies by platform
-        #   5.times.do
+        #   5.times do
         #     stream.send MicrophoneInput.read(32000)
         #   end
         #
@@ -430,7 +433,7 @@ module Google
         end
         # @private returns single final result once :END_OF_UTTERANCE is
-        # recieved.
+        # received.
         def utterance!
           synchronize do
             @callbacks[:utterance].each(&:call)
@@ -438,7 +441,7 @@ module Google
         end
         ##
-        # Register to be notified of an error recieved during the stream.
+        # Register to be notified of an error received during the stream.
         #
         # @yield [callback] The block for accessing final results.
         # @yieldparam [Exception] error The error raised.
@@ -448,7 +451,7 @@ module Google
         #
         #   speech = Google::Cloud::Speech.new
         #
-        #   stream = audio.stream encoding: :raw, sample_rate: 16000
+        #   stream = speech.stream encoding: :raw, sample_rate: 16000
         #
         #   # register callback for when an error is returned
         #   stream.on_error do |error|
@@ -456,9 +459,9 @@ module Google
         #     stream.stop
         #   end
         #
-        #   # Stream 5 seconds of audio from the microhone
+        #   # Stream 5 seconds of audio from the microphone
         #   # Actual implementation of microphone input varies by platform
-        #   5.times.do
+        #   5.times do
         #     stream.send MicrophoneInput.read(32000)
         #   end
         #

data/lib/google/cloud/speech/v1beta1/doc/google/cloud/speech/v1beta1/cloud_speech.rb ADDED

@@ -0,0 +1,377 @@
+# Copyright 2016 Google Inc. All rights reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+module Google
+  module Cloud
+    module Speech
+      module V1beta1
+        # +SyncRecognizeRequest+ is the top-level message sent by the client for
+        # the +SyncRecognize+ method.
+        # @!attribute [rw] config
+        #   @return [Google::Cloud::Speech::V1beta1::RecognitionConfig]
+        #     [Required] The +config+ message provides information to the recognizer
+        #     that specifies how to process the request.
+        # @!attribute [rw] audio
+        #   @return [Google::Cloud::Speech::V1beta1::RecognitionAudio]
+        #     [Required] The audio data to be recognized.
+        class SyncRecognizeRequest; end
+        # +AsyncRecognizeRequest+ is the top-level message sent by the client for
+        # the +AsyncRecognize+ method.
+        # @!attribute [rw] config
+        #   @return [Google::Cloud::Speech::V1beta1::RecognitionConfig]
+        #     [Required] The +config+ message provides information to the recognizer
+        #     that specifies how to process the request.
+        # @!attribute [rw] audio
+        #   @return [Google::Cloud::Speech::V1beta1::RecognitionAudio]
+        #     [Required] The audio data to be recognized.
+        class AsyncRecognizeRequest; end
+        # +StreamingRecognizeRequest+ is the top-level message sent by the client for
+        # the +StreamingRecognize+ method. Multiple +StreamingRecognizeRequest+
+        # messages are sent. The first message must contain a +streaming_config+
+        # message and must not contain +audio+ data. All subsequent messages must
+        # contain +audio+ data and must not contain a +streaming_config+ message.
+        # @!attribute [rw] streaming_config
+        #   @return [Google::Cloud::Speech::V1beta1::StreamingRecognitionConfig]
+        #     The +streaming_config+ message provides information to the recognizer
+        #     that specifies how to process the request.
+        #
+        #     The first +StreamingRecognizeRequest+ message must contain a
+        #     +streaming_config+ message.
+        # @!attribute [rw] audio_content
+        #   @return [String]
+        #     The audio data to be recognized. Sequential chunks of audio data are sent
+        #     in sequential +StreamingRecognizeRequest+ messages. The first
+        #     +StreamingRecognizeRequest+ message must not contain +audio_content+ data
+        #     and all subsequent +StreamingRecognizeRequest+ messages must contain
+        #     +audio_content+ data. The audio bytes must be encoded as specified in
+        #     +RecognitionConfig+. Note: as with all bytes fields, protobuffers use a
+        #     pure binary representation (not base64). See
+        #     {audio limits}[https://cloud.google.com/speech/limits#content].
+        class StreamingRecognizeRequest; end
+        # The +StreamingRecognitionConfig+ message provides information to the
+        # recognizer that specifies how to process the request.
+        # @!attribute [rw] config
+        #   @return [Google::Cloud::Speech::V1beta1::RecognitionConfig]
+        #     [Required] The +config+ message provides information to the recognizer
+        #     that specifies how to process the request.
+        # @!attribute [rw] single_utterance
+        #   @return [true, false]
+        #     [Optional] If +false+ or omitted, the recognizer will perform continuous
+        #     recognition (continuing to process audio even if the user pauses speaking)
+        #     until the client closes the output stream (gRPC API) or when the maximum
+        #     time limit has been reached. Multiple +StreamingRecognitionResult+s with
+        #     the +is_final+ flag set to +true+ may be returned.
+        #
+        #     If +true+, the recognizer will detect a single spoken utterance. When it
+        #     detects that the user has paused or stopped speaking, it will return an
+        #     +END_OF_UTTERANCE+ event and cease recognition. It will return no more than
+        #     one +StreamingRecognitionResult+ with the +is_final+ flag set to +true+.
+        # @!attribute [rw] interim_results
+        #   @return [true, false]
+        #     [Optional] If +true+, interim results (tentative hypotheses) may be
+        #     returned as they become available (these interim results are indicated with
+        #     the +is_final=false+ flag).
+        #     If +false+ or omitted, only +is_final=true+ result(s) are returned.
+        class StreamingRecognitionConfig; end
+        # The +RecognitionConfig+ message provides information to the recognizer
+        # that specifies how to process the request.
+        # @!attribute [rw] encoding
+        #   @return [Google::Cloud::Speech::V1beta1::RecognitionConfig::AudioEncoding]
+        #     [Required] Encoding of audio data sent in all +RecognitionAudio+ messages.
+        # @!attribute [rw] sample_rate
+        #   @return [Integer]
+        #     [Required] Sample rate in Hertz of the audio data sent in all
+        #     +RecognitionAudio+ messages. Valid values are: 8000-48000.
+        #     16000 is optimal. For best results, set the sampling rate of the audio
+        #     source to 16000 Hz. If that's not possible, use the native sample rate of
+        #     the audio source (instead of re-sampling).
+        # @!attribute [rw] language_code
+        #   @return [String]
+        #     [Optional] The language of the supplied audio as a BCP-47 language tag.
+        #     Example: "en-GB"  https://www.rfc-editor.org/rfc/bcp/bcp47.txt
+        #     If omitted, defaults to "en-US". See
+        #     {Language Support}[https://cloud.google.com/speech/docs/best-practices#language_support]
+        #     for a list of the currently supported language codes.
+        # @!attribute [rw] max_alternatives
+        #   @return [Integer]
+        #     [Optional] Maximum number of recognition hypotheses to be returned.
+        #     Specifically, the maximum number of +SpeechRecognitionAlternative+ messages
+        #     within each +SpeechRecognitionResult+.
+        #     The server may return fewer than +max_alternatives+.
+        #     Valid values are +0+-+30+. A value of +0+ or +1+ will return a maximum of
+        #     +1+. If omitted, defaults to +1+.
+        # @!attribute [rw] profanity_filter
+        #   @return [true, false]
+        #     [Optional] If set to +true+, the server will attempt to filter out
+        #     profanities, replacing all but the initial character in each filtered word
+        #     with asterisks, e.g. "f***". If set to +false+ or omitted, profanities
+        #     won't be filtered out.
+        # @!attribute [rw] speech_context
+        #   @return [Google::Cloud::Speech::V1beta1::SpeechContext]
+        #     [Optional] A means to provide context to assist the speech recognition.
+        class RecognitionConfig
+          # Audio encoding of the data sent in the audio message. All encodings support
+          # only 1 channel (mono) audio. Only +FLAC+ includes a header that describes
+          # the bytes of audio that follow the header. The other encodings are raw
+          # audio bytes with no header.
+          #
+          # For best results, the audio source should be captured and transmitted using
+          # a lossless encoding (+FLAC+ or +LINEAR16+). Recognition accuracy may be
+          # reduced if lossy codecs (such as AMR, AMR_WB and MULAW) are used to capture
+          # or transmit the audio, particularly if background noise is present.
+          module AudioEncoding
+            # Not specified. Will return result Google::Rpc::Code::INVALID_ARGUMENT.
+            ENCODING_UNSPECIFIED = 0
+            # Uncompressed 16-bit signed little-endian samples (Linear PCM).
+            # This is the only encoding that may be used by +AsyncRecognize+.
+            LINEAR16 = 1
+            # This is the recommended encoding for +SyncRecognize+ and
+            # +StreamingRecognize+ because it uses lossless compression; therefore
+            # recognition accuracy is not compromised by a lossy codec.
+            #
+            # The stream FLAC (Free Lossless Audio Codec) encoding is specified at:
+            # http://flac.sourceforge.net/documentation.html.
+            # 16-bit and 24-bit samples are supported.
+            # Not all fields in STREAMINFO are supported.
+            FLAC = 2
+            # 8-bit samples that compand 14-bit audio samples using G.711 PCMU/mu-law.
+            MULAW = 3
+            # Adaptive Multi-Rate Narrowband codec. +sample_rate+ must be 8000 Hz.
+            AMR = 4
+            # Adaptive Multi-Rate Wideband codec. +sample_rate+ must be 16000 Hz.
+            AMR_WB = 5
+          end
+        end
+        # Provides "hints" to the speech recognizer to favor specific words and phrases
+        # in the results.
+        # @!attribute [rw] phrases
+        #   @return [Array<String>]
+        #     [Optional] A list of strings containing words and phrases "hints" so that
+        #     the speech recognition is more likely to recognize them. This can be used
+        #     to improve the accuracy for specific words and phrases, for example, if
+        #     specific commands are typically spoken by the user. This can also be used
+        #     to add additional words to the vocabulary of the recognizer. See
+        #     {usage limits}[https://cloud.google.com/speech/limits#content].
+        class SpeechContext; end
+        # Contains audio data in the encoding specified in the +RecognitionConfig+.
+        # Either +content+ or +uri+ must be supplied. Supplying both or neither
+        # returns Google::Rpc::Code::INVALID_ARGUMENT. See
+        # {audio limits}[https://cloud.google.com/speech/limits#content].
+        # @!attribute [rw] content
+        #   @return [String]
+        #     The audio data bytes encoded as specified in
+        #     +RecognitionConfig+. Note: as with all bytes fields, protobuffers use a
+        #     pure binary representation, whereas JSON representations use base64.
+        # @!attribute [rw] uri
+        #   @return [String]
+        #     URI that points to a file that contains audio data bytes as specified in
+        #     +RecognitionConfig+. Currently, only Google Cloud Storage URIs are
+        #     supported, which must be specified in the following format:
+        #     +gs://bucket_name/object_name+ (other URI formats return
+        #     Google::Rpc::Code::INVALID_ARGUMENT). For more information, see
+        #     {Request URIs}[https://cloud.google.com/storage/docs/reference-uris].
+        class RecognitionAudio; end
+        # +SyncRecognizeResponse+ is the only message returned to the client by
+        # +SyncRecognize+. It contains the result as zero or more sequential
+        # +SpeechRecognitionResult+ messages.
+        # @!attribute [rw] results
+        #   @return [Array<Google::Cloud::Speech::V1beta1::SpeechRecognitionResult>]
+        #     [Output-only] Sequential list of transcription results corresponding to
+        #     sequential portions of audio.
+        class SyncRecognizeResponse; end
+        # +AsyncRecognizeResponse+ is the only message returned to the client by
+        # +AsyncRecognize+. It contains the result as zero or more sequential
+        # +SpeechRecognitionResult+ messages. It is included in the +result.response+
+        # field of the +Operation+ returned by the +GetOperation+ call of the
+        # +google::longrunning::Operations+ service.
+        # @!attribute [rw] results
+        #   @return [Array<Google::Cloud::Speech::V1beta1::SpeechRecognitionResult>]
+        #     [Output-only] Sequential list of transcription results corresponding to
+        #     sequential portions of audio.
+        class AsyncRecognizeResponse; end
+        # +AsyncRecognizeMetadata+ describes the progress of a long-running
+        # +AsyncRecognize+ call. It is included in the +metadata+ field of the
+        # +Operation+ returned by the +GetOperation+ call of the
+        # +google::longrunning::Operations+ service.
+        # @!attribute [rw] progress_percent
+        #   @return [Integer]
+        #     Approximate percentage of audio processed thus far. Guaranteed to be 100
+        #     when the audio is fully processed and the results are available.
+        # @!attribute [rw] start_time
+        #   @return [Google::Protobuf::Timestamp]
+        #     Time when the request was received.
+        # @!attribute [rw] last_update_time
+        #   @return [Google::Protobuf::Timestamp]
+        #     Time of the most recent processing update.
+        class AsyncRecognizeMetadata; end
+        # +StreamingRecognizeResponse+ is the only message returned to the client by
+        # +StreamingRecognize+. A series of one or more +StreamingRecognizeResponse+
+        # messages are streamed back to the client.
+        #
+        # Here's an example of a series of ten +StreamingRecognizeResponse+s that might
+        # be returned while processing audio:
+        #
+        # 1. endpointer_type: START_OF_SPEECH
+        #
+        # 2. results { alternatives { transcript: "tube" } stability: 0.01 }
+        #    result_index: 0
+        #
+        # 3. results { alternatives { transcript: "to be a" } stability: 0.01 }
+        #    result_index: 0
+        #
+        # 4. results { alternatives { transcript: "to be" } stability: 0.9 }
+        #    results { alternatives { transcript: " or not to be" } stability: 0.01 }
+        #    result_index: 0
+        #
+        # 5. results { alternatives { transcript: "to be or not to be"
+        #                             confidence: 0.92 }
+        #              alternatives { transcript: "to bee or not to bee" }
+        #              is_final: true }
+        #    result_index: 0
+        #
+        # 6. results { alternatives { transcript: " that's" } stability: 0.01 }
+        #    result_index: 1
+        #
+        # 7. results { alternatives { transcript: " that is" } stability: 0.9 }
+        #    results { alternatives { transcript: " the question" } stability: 0.01 }
+        #    result_index: 1
+        #
+        # 8. endpointer_type: END_OF_SPEECH
+        #
+        # 9. results { alternatives { transcript: " that is the question"
+        #                             confidence: 0.98 }
+        #              alternatives { transcript: " that was the question" }
+        #              is_final: true }
+        #    result_index: 1
+        #
+        # 10. endpointer_type: END_OF_AUDIO
+        #
+        # Notes:
+        #
+        # - Only two of the above responses, #5 and #9, contain final results;
+        #   they are indicated by +is_final: true+. Concatenating these together
+        #   generates the full transcript: "to be or not to be that is the question".
+        #
+        # - The others contain interim +results+. #4 and #7 contain two interim
+        #   +results+: the first portion has a high stability and is less likely to
+        #   change; the second portion has a low stability and is very likely to
+        #   change. A UI designer might choose to show only high stability +results+.
+        #
+        # - The +result_index+ indicates the portion of audio that has had final
+        #   results returned, and is no longer being processed. For example, the
+        #   +results+ in #6 and later correspond to the portion of audio after
+        #   "to be or not to be".
+        # @!attribute [rw] error
+        #   @return [Google::Rpc::Status]
+        #     [Output-only] If set, returns a Google::Rpc::Status message that
+        #     specifies the error for the operation.
+        # @!attribute [rw] results
+        #   @return [Array<Google::Cloud::Speech::V1beta1::StreamingRecognitionResult>]
+        #     [Output-only] This repeated list contains zero or more results that
+        #     correspond to consecutive portions of the audio currently being processed.
+        #     It contains zero or one +is_final=true+ result (the newly settled portion),
+        #     followed by zero or more +is_final=false+ results.
+        # @!attribute [rw] result_index
+        #   @return [Integer]
+        #     [Output-only] Indicates the lowest index in the +results+ array that has
+        #     changed. The repeated +StreamingRecognitionResult+ results overwrite past
+        #     results at this index and higher.
+        # @!attribute [rw] endpointer_type
+        #   @return [Google::Cloud::Speech::V1beta1::StreamingRecognizeResponse::EndpointerType]
+        #     [Output-only] Indicates the type of endpointer event.
+        class StreamingRecognizeResponse
+          # Indicates the type of endpointer event.
+          module EndpointerType
+            # No endpointer event specified.
+            ENDPOINTER_EVENT_UNSPECIFIED = 0
+            # Speech has been detected in the audio stream.
+            START_OF_SPEECH = 1
+            # Speech has ceased to be detected in the audio stream.
+            END_OF_SPEECH = 2
+            # The end of the audio stream has been reached, and it is being processed.
+            END_OF_AUDIO = 3
+            # This event is only sent when +single_utterance+ is +true+. It indicates
+            # that the server has detected the end of the user's speech utterance and
+            # expects no additional speech. Therefore, the server will not process
+            # additional audio. The client should stop sending additional audio data.
+            END_OF_UTTERANCE = 4
+          end
+        end
+        # A streaming speech recognition result corresponding to a portion of the audio
+        # that is currently being processed.
+        # @!attribute [rw] alternatives
+        #   @return [Array<Google::Cloud::Speech::V1beta1::SpeechRecognitionAlternative>]
+        #     [Output-only] May contain one or more recognition hypotheses (up to the
+        #     maximum specified in +max_alternatives+).
+        # @!attribute [rw] is_final
+        #   @return [true, false]
+        #     [Output-only] If +false+, this +StreamingRecognitionResult+ represents an
+        #     interim result that may change. If +true+, this is the final time the
+        #     speech service will return this particular +StreamingRecognitionResult+,
+        #     the recognizer will not return any further hypotheses for this portion of
+        #     the transcript and corresponding audio.
+        # @!attribute [rw] stability
+        #   @return [Float]
+        #     [Output-only] An estimate of the probability that the recognizer will not
+        #     change its guess about this interim result. Values range from 0.0
+        #     (completely unstable) to 1.0 (completely stable). Note that this is not the
+        #     same as +confidence+, which estimates the probability that a recognition
+        #     result is correct.
+        #     This field is only provided for interim results (+is_final=false+).
+        #     The default of 0.0 is a sentinel value indicating stability was not set.
+        class StreamingRecognitionResult; end
+        # A speech recognition result corresponding to a portion of the audio.
+        # @!attribute [rw] alternatives
+        #   @return [Array<Google::Cloud::Speech::V1beta1::SpeechRecognitionAlternative>]
+        #     [Output-only] May contain one or more recognition hypotheses (up to the
+        #     maximum specified in +max_alternatives+).
+        class SpeechRecognitionResult; end
+        # Alternative hypotheses (a.k.a. n-best list).
+        # @!attribute [rw] transcript
+        #   @return [String]
+        #     [Output-only] Transcript text representing the words that the user spoke.
+        # @!attribute [rw] confidence
+        #   @return [Float]
+        #     [Output-only] The confidence estimate between 0.0 and 1.0. A higher number
+        #     means the system is more confident that the recognition is correct.
+        #     This field is typically provided only for the top hypothesis, and only for
+        #     +is_final=true+ results.
+        #     The default of 0.0 is a sentinel value indicating confidence was not set.
+        class SpeechRecognitionAlternative; end
+      end
+    end
+  end
+end

data/lib/google/cloud/speech/v1beta1/speech_api.rb CHANGED

@@ -158,10 +158,10 @@ module Google
               config,
               audio,
               options: nil
-            req = Google::Cloud::Speech::V1beta1::SyncRecognizeRequest.new(
+            req = Google::Cloud::Speech::V1beta1::SyncRecognizeRequest.new({
               config: config,
               audio: audio
-            )
+            }.delete_if { |_, v| v.nil? })
             @sync_recognize.call(req, options)
           end
@@ -196,10 +196,10 @@ module Google
               config,
               audio,
               options: nil
-            req = Google::Cloud::Speech::V1beta1::AsyncRecognizeRequest.new(
+            req = Google::Cloud::Speech::V1beta1::AsyncRecognizeRequest.new({
               config: config,
               audio: audio
-            )
+            }.delete_if { |_, v| v.nil? })
             @async_recognize.call(req, options)
           end
         end

data/lib/google/cloud/speech/version.rb CHANGED

@@ -16,7 +16,7 @@
 module Google
   module Cloud
     module Speech
-      VERSION = "0.21.0"
+      VERSION = "0.21.1"
     end
   end
 end

metadata CHANGED

@@ -1,7 +1,7 @@
 --- !ruby/object:Gem::Specification
 name: google-cloud-speech
 version: !ruby/object:Gem::Version
-  version: 0.21.0
+  version: 0.21.1
 platform: ruby
 authors:
 - Mike Moore
@@ -9,7 +9,7 @@ authors:
 autorequire:
 bindir: bin
 cert_chain: []
-date: 2016-10-20 00:00:00.000000000 Z
+date: 2016-11-19 00:00:00.000000000 Z
 dependencies:
 - !ruby/object:Gem::Dependency
   name: google-cloud-core
@@ -199,14 +199,14 @@ dependencies:
     requirements:
     - - "~>"
       - !ruby/object:Gem::Version
-        version: 0.1.6
+        version: 0.1.8
   type: :development
   prerelease: false
   version_requirements: !ruby/object:Gem::Requirement
     requirements:
     - - "~>"
       - !ruby/object:Gem::Version
-        version: 0.1.6
+        version: 0.1.8
 description: google-cloud-speech is the official library for Google Cloud Speech API.
 email:
 - mike@blowmage.com
@@ -215,6 +215,9 @@ executables: []
 extensions: []
 extra_rdoc_files: []
 files:
+- ".yardopts"
+- LICENSE
+- README.md
 - lib/google-cloud-speech.rb
 - lib/google/cloud/speech.rb
 - lib/google/cloud/speech/audio.rb
@@ -227,6 +230,7 @@ files:
 - lib/google/cloud/speech/v1beta1.rb
 - lib/google/cloud/speech/v1beta1/cloud_speech_pb.rb
 - lib/google/cloud/speech/v1beta1/cloud_speech_services_pb.rb
+- lib/google/cloud/speech/v1beta1/doc/google/cloud/speech/v1beta1/cloud_speech.rb
 - lib/google/cloud/speech/v1beta1/speech_api.rb
 - lib/google/cloud/speech/v1beta1/speech_client_config.json
 - lib/google/cloud/speech/version.rb
@@ -250,7 +254,7 @@ required_rubygems_version: !ruby/object:Gem::Requirement
       version: '0'
 requirements: []
 rubyforge_project:
-rubygems_version: 2.6.4
+rubygems_version: 2.4.5.1
 signing_key:
 specification_version: 4
 summary: API Client library for Google Cloud Speech API