RubyGems - google_speech - Versions diffs - 0.3.3 → 0.4.0 - Mend

google_speech 0.3.3 → 0.4.0

This diff shows the differences between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (8)

checksums.yaml +4 -4
data/google_speech.gemspec +1 -0
data/lib/google_speech.rb +2 -0
data/lib/google_speech/chunk.rb +6 -0
data/lib/google_speech/chunk_factory.rb +8 -3
data/lib/google_speech/transcriber.rb +28 -10
data/lib/google_speech/version.rb +1 -1
metadata +15 -1

checksums.yaml CHANGED

@@ -1,7 +1,7 @@
 ---
 SHA1:
-  metadata.gz: ec2a81e64decb108511c6e41e180634d3c5e2fb0
-  data.tar.gz: 547610e9ebb2c7c8f881a952eb089ec4f2ccd0fd
+  metadata.gz: 6813210970cbd391fc353833b73cf483fecb35be
+  data.tar.gz: 9800a202fb0bb0a66cf6e74f921021cb1f89f4f8
 SHA512:
-  metadata.gz: 33efc21a61cf1bce77e10ca55c5df5c545da5638e56e12cb1598388360e3d539c9f75e720ad4349bf8d0323fe410d2019042b25081715e54fe242a9044e8567f
-  data.tar.gz: 7658ba2000a389388bcc58d35ad120a375f6365634f0b9ffe16e5b399cb5cd94af83250091a40fd5ce3d588b364fc14e223ef3aae81bc86946002d532a371178
+  metadata.gz: f77c8400be4f09302c472fa3da92679ff557e8f1a44b1bf12830c76d233130e500bba99583e62d2921a7d8d6a5850fe717b716f923cd754f9b9a8e87ba52156b
+  data.tar.gz: c998ca0fee9037f8691ae0c68dd994b555a3c13073afde8f93d58e5e47f179555df5beb4f669356ef8bcff5297c5c7d1db379e98b016a3fc4dd6aef3457fca12

data/google_speech.gemspec CHANGED

@@ -21,6 +21,7 @@ Gem::Specification.new do |gem|
   gem.require_paths = ["lib"]
   gem.add_dependency "excon"
+  gem.add_dependency "uuid"
   gem.add_development_dependency "rake"
   gem.add_development_dependency "minitest"

data/lib/google_speech.rb CHANGED

@@ -5,6 +5,8 @@ require 'logger'
 module GoogleSpeech
+  TMP_FILE_DIR = ENV['GOOGLE_SPEECH_TMP_DIR'] || '/tmp/'
   def self.logger
     @_logger ||= Logger.new(STDOUT)
   end

data/lib/google_speech/chunk.rb CHANGED

@@ -33,5 +33,11 @@ module GoogleSpeech
       GoogleSpeech.logger
     end
+    def close_file
+      return unless @chunk_file
+      @chunk_file.close rescue nil
+      @chunk_file.unlink rescue nil
+    end
   end
 end

data/lib/google_speech/chunk_factory.rb CHANGED

@@ -18,9 +18,14 @@ module GoogleSpeech
     def each
       pos = 0
       while(pos < @original_duration) do
-        chunk = Chunk.new(@original_file, @original_duration, pos, (@chunk_duration + @overlap), @rate)
-        yield chunk
-        pos = pos + [chunk.duration, @chunk_duration].min
+        chunk = nil
+        begin
+          chunk = Chunk.new(@original_file, @original_duration, pos, (@chunk_duration + @overlap), @rate)
+          yield chunk
+          pos = pos + [chunk.duration, @chunk_duration].min
+        ensure
+          chunk.close_file if chunk
+        end
       end
     end

data/lib/google_speech/transcriber.rb CHANGED

@@ -2,6 +2,7 @@
 require 'excon'
 require 'json'
+require 'uuid'
 module GoogleSpeech
@@ -31,21 +32,38 @@ module GoogleSpeech
       @last_ua = 0
     end
+    def open_working_file
+      Utility.check_local_file(@original_file.path)
+      wf_path = random_file_name(@original_file.path)
+      FileUtils.ln(@original_file.path, wf_path)
+      File.open(wf_path, 'r') {|f|
+        yield f
+      }
+      FileUtils.rm(wf_path, :force=>true)
+    end
+    def random_file_name(path)
+      File.join(GoogleSpeech::TMP_FILE_DIR, File.basename(path) + '_' + UUID.generate + '.wav')
+    end
     def transcribe
-      chunk_factory = ChunkFactory.new(@original_file, options[:chunk_duration], options[:overlap], options[:rate])
-      chunk_factory.each{ |chunk|
-        result = chunk.to_hash
-        transcript = transcribe_data(chunk.data)
-        next unless transcript
+      open_working_file do |working_file|
+        chunk_factory = ChunkFactory.new(working_file, options[:chunk_duration], options[:overlap], options[:rate])
+        chunk_factory.each{ |chunk|
+          result = chunk.to_hash
+          transcript = transcribe_data(chunk.data)
+          next unless transcript
-        result = result.merge(extract_result(transcript))
+          result = result.merge(extract_result(transcript))
-        logger.debug "#{result[:start_time]}: #{(result[:confidence].to_f * 100).to_i}%: #{result[:text]}"
+          logger.debug "#{result[:start_time]}: #{(result[:confidence].to_f * 100).to_i}%: #{result[:text]}"
-        @results << result
+          @results << result
+          sleep(options[:request_pause].to_i)
+        }
+      end
-        sleep(options[:request_pause].to_i)
-      }
       @results
     end

data/lib/google_speech/version.rb CHANGED

@@ -1,5 +1,5 @@
 # -*- encoding: utf-8 -*-
 module GoogleSpeech
-  VERSION = "0.3.3"
+  VERSION = "0.4.0"
 end

metadata CHANGED

@@ -1,7 +1,7 @@
 --- !ruby/object:Gem::Specification
 name: google_speech
 version: !ruby/object:Gem::Version
-  version: 0.3.3
+  version: 0.4.0
 platform: ruby
 authors:
 - Andrew Kuklewicz
@@ -24,6 +24,20 @@ dependencies:
     - - '>='
       - !ruby/object:Gem::Version
         version: '0'
+- !ruby/object:Gem::Dependency
+  name: uuid
+  requirement: !ruby/object:Gem::Requirement
+    requirements:
+    - - '>='
+      - !ruby/object:Gem::Version
+        version: '0'
+  type: :runtime
+  prerelease: false
+  version_requirements: !ruby/object:Gem::Requirement
+    requirements:
+    - - '>='
+      - !ruby/object:Gem::Version
+        version: '0'
 - !ruby/object:Gem::Dependency
   name: rake
   requirement: !ruby/object:Gem::Requirement