RubyGems - google_speech - Versions diffs - 0.1.2 → 0.1.3 - Mend

google_speech 0.1.2 → 0.1.3

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (5)

data/README.md +21 -17
data/lib/google_speech/transcriber.rb +7 -3
data/lib/google_speech/utility.rb +4 -1
data/lib/google_speech/version.rb +1 -1
metadata +4 -4

data/README.md CHANGED Viewed

@@ -26,20 +26,22 @@ Or install it yourself as:
 ## Usage
-As a gem in yourt code:
+As a gem in your code:
+```ruby
+require 'google_speech'
-	require 'google_speech'
-	f = File.open '/Users/you/Downloads/audio.wav'
-  	transcriber = GoogleSpeech::Transcriber.new(f)
-  	t = transcriber.transcribe
+f = File.open '/Users/you/Downloads/audio.wav'
+transcriber = GoogleSpeech::Transcriber.new(f)
+t = transcriber.transcribe
+```
 As a command line tool
 	> google_speech somefile.wav
-Options:
+### Options:
 * language - what language is the speech in
 * chunk_duration - length in seconds for each audio chunk of the wav to send
 * overlap - chunking does not respect word boundaries; overlap can compensate
@@ -47,16 +49,18 @@ Options:
 * request_pause - sleep seconds between chunk transcription requests
 * profanity_filter - google by default filters profanity; this gem does not.
-Default option values:
-	{
-		:language         => 'en-US',
-		:chunk_duration   => 8,
-		:overlap          => 1,
-		:max_results      => 2,
-		:request_pause    => 1,
-		:profanity_filter => false
-	}
+### Default option values:
+```ruby
+{
+	:language         => 'en-US',
+	:chunk_duration   => 8,
+	:overlap          => 1,
+	:max_results      => 2,
+	:request_pause    => 1,
+	:profanity_filter => false
+}
+```
 ## Contributing

data/lib/google_speech/transcriber.rb CHANGED Viewed

@@ -10,7 +10,7 @@ module GoogleSpeech
     DEFAULT_OPTIONS =   {
       :language         => 'en-US',
-      :chunk_duration   => 8,
+      :chunk_duration   => 5,
       :overlap          => 1,
       :max_results      => 2,
       :request_pause    => 1,
@@ -28,12 +28,14 @@ module GoogleSpeech
       chunk_factory.each{ |chunk|
         result = chunk.to_hash
         transcript = transcribe_data(chunk.data)
+        next unless transcript
+        # puts "transcript: #{transcript.inspect}\n\n"
         hypothesis = transcript['hypotheses'].first || Hash.new("")
         result[:text]       = hypothesis['utterance']
         result[:confidence] = hypothesis['confidence']
         @results << result
-        # puts "\n#{result[:start_time]} - #{result[:start_time].to_i + result[:duration].to_i}: #{(result[:confidence].to_f * 100).to_i}%: #{result[:text]}"
+        # puts "\n#{result[:start_time]}: #{(result[:confidence].to_f * 100).to_i}%: #{result[:text]}"
         sleep(options[:request_pause].to_i)
       }
@@ -66,8 +68,10 @@ module GoogleSpeech
       while(!result && retry_count < retry_max)
         connection = Excon.new(url)
         response = connection.request(params)
+        # puts "response: #{response.inspect}\n\n"
         if response.status.to_s.start_with?('2')
-          result = JSON.parse(response.body)
+          result = JSON.parse(response.body)
+          # puts "results: #{result.inspect}\n\n"
         else
           sleep(1)
           retry_count += 1

data/lib/google_speech/utility.rb CHANGED Viewed

@@ -23,7 +23,10 @@ module GoogleSpeech
       def trim_to_flac(wav_path, duration, flac_path, start, length)
         check_local_file(wav_path)
-        command = "sox -t wav '#{wav_path}' -t flac '#{flac_path}' trim #{start.to_i} #{length.to_i} rate 16k"
+        command = "sox -t wav '#{wav_path}' -r 16000 -c 1 -t flac '#{flac_path}' trim #{start.to_i} #{length.to_i} compand .5,2 -80,-80,-75,-50,-30,-15,0,0 norm -0.1"
+        # command = "sox -t wav '#{wav_path}' -t flac '#{flac_path}' trim #{start.to_i} #{length.to_i} rate 16k"
         out, err = run_command(command)
         response = out + err
         response.split("\n").each{ |l| raise("trim_to_flac: error cmd: '#{command}'\nout: '#{response}'") if l =~ SOX_ERROR_RE }

data/lib/google_speech/version.rb CHANGED Viewed

@@ -1,5 +1,5 @@
 # -*- encoding: utf-8 -*-
 module GoogleSpeech
-  VERSION = "0.1.2"
+  VERSION = "0.1.3"
 end

metadata CHANGED Viewed

@@ -1,7 +1,7 @@
 --- !ruby/object:Gem::Specification
 name: google_speech
 version: !ruby/object:Gem::Version
-  version: 0.1.2
+  version: 0.1.3
   prerelease:
 platform: ruby
 authors:
@@ -9,7 +9,7 @@ authors:
 autorequire:
 bindir: bin
 cert_chain: []
-date: 2013-03-09 00:00:00.000000000 Z
+date: 2013-09-03 00:00:00.000000000 Z
 dependencies:
 - !ruby/object:Gem::Dependency
   name: excon
@@ -97,7 +97,7 @@ required_ruby_version: !ruby/object:Gem::Requirement
       version: '0'
       segments:
       - 0
-      hash: 4464618755073906790
+      hash: -4222726659936394268
 required_rubygems_version: !ruby/object:Gem::Requirement
   none: false
   requirements:
@@ -106,7 +106,7 @@ required_rubygems_version: !ruby/object:Gem::Requirement
       version: '0'
       segments:
       - 0
-      hash: 4464618755073906790
+      hash: -4222726659936394268
 requirements: []
 rubyforge_project:
 rubygems_version: 1.8.23