RubyGems - speech_to_text - Versions diffs - 0.1.4 → 0.1.5 - Mend

speech_to_text 0.1.4 → 0.1.5

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (13) hide show

checksums.yaml +4 -4
data/.gitignore +5 -0
data/Gemfile.lock +1 -1
data/README.md +1 -1
data/lib/speech_to_text/3playmedia.rb +13 -1
data/lib/speech_to_text/deepspeech.rb +29 -2
data/lib/speech_to_text/google.rb +5 -8
data/lib/speech_to_text/speechmatics.rb +15 -1
data/lib/speech_to_text/util.rb +22 -8
data/lib/speech_to_text/version.rb +1 -1
metadata +2 -4
data/abc.mp3 +0 -0
data/webcams.webm +0 -0

checksums.yaml CHANGED Viewed

@@ -1,7 +1,7 @@
 ---
 SHA256:
-  metadata.gz: 0601f9186723489cc821a5afe961b94925734a73586f134b43cd8c28ce6c4e68
-  data.tar.gz: 7f7fd338e9255e5357a6f6a684131559b386f8377617f33ede8c1b90c8d777de
+  metadata.gz: 912dddca8963d0db76d95ca167a7a0935c264a39384c6baec8dc20c956b97f8a
+  data.tar.gz: bbdeaf426301438a7009e38d07c008c0253b18e1c56e61c2c063e678d7c17128
 SHA512:
-  metadata.gz: e1f01caf754a1a015c7c82a2d8bf0e3112a7224859cbbf527d977a84cfc60b407cb9708cc756d63ebc175650282c64fb2f10c1de878aa7c38973dc392e492263
-  data.tar.gz: 3a9ddd6b49011df32d52d50b4f3c83b48c78e11b3e0fac458cb1e75231769e86fa1b4600735cd56d1bd8676b1987f4a605aa936dfc2832af5288d49d5c92f7cd
+  metadata.gz: 2dc6bc04f997a4f4101b3b5c45de7e354d11eacac6d3f7ad217df4eabc0afa1a30c1584c9bcc4ba63ab8008914a0a37da8515bbb64a03fb7c1390a0701e726cf
+  data.tar.gz: 8980ccbe70389e5029a145a0a4bcfefa72b2e2f815f49daf42bb300291f7cd33e8b2da6f2a69dca79a548ea7225f7578d1199198b9bc8cc1556829fc464846d5

data/.gitignore CHANGED Viewed

@@ -7,3 +7,8 @@
 /spec/reports/
 /tmp/
 *.gem
+*.mp3
+*.mp4
+*.webm
+*.wav
+*.flac

data/Gemfile.lock CHANGED Viewed

@@ -1,7 +1,7 @@
 PATH
   remote: .
   specs:
-    speech_to_text (0.1.4)
+    speech_to_text (0.1.5)
       google-cloud-speech (= 0.35.0)
       google-cloud-storage (= 1.18.2)
       ibm_watson (~> 0.18.2)

data/README.md CHANGED Viewed

@@ -79,7 +79,7 @@ bucket_name could be any string
 file = SpeechToText::GoogleS2T.google_storage(audio_file_path,audio_name,audio_content_type,bucket_name)
 operation_name = SpeechToText::GoogleS2T.create_job(audio_name,audio_content_type,bucket_name,language_code)
-data = SpeechToText::GoogleS2T.check_job(operation_name)
+data = SpeechToText::GoogleS2T.check_status(operation_name)
 myarray = SpeechToText::GoogleS2T.create_array_google(data["results"])
 SpeechToText::GoogleS2T.delete_google_storage(bucket_name,audio_name,audio_content_type)
 ```

data/lib/speech_to_text/3playmedia.rb CHANGED Viewed

@@ -11,12 +11,24 @@
 require 'json'
 require 'net/http'
 require 'uri'
+require 'open3'
 module SpeechToText
   module ThreePlaymediaS2T # rubocop:disable Style/Documentation
     def self.create_job(api_key, audio_file, name, create_job_file)
       cretae_job_command = "curl -X POST -F \"source_file=@#{audio_file}\" \"https://api.3playmedia.com/v3/files?api_key=#{api_key}&language_id=1&name=#{name}\" > #{create_job_file}"
-      system(cretae_job_command)
+      Open3.popen2e(cretae_job_command) do |stdin, stdout_err, wait_thr|
+        while line = stdout_err.gets
+          puts "#{line}"
+        end
+        exit_status = wait_thr.value
+        unless exit_status.success?
+          puts '---------------------'
+          puts "FAILED to execute --> #{cretae_job_command}"
+          puts '---------------------'
+        end
+      end
       file = File.open(create_job_file, 'r')
       response = JSON.load file
       job_id = response['data']['id']

data/lib/speech_to_text/deepspeech.rb CHANGED Viewed

@@ -11,6 +11,7 @@
 require 'json'
 require 'net/http'
 require 'uri'
+require 'open3'
 require_relative 'util.rb'
 module SpeechToText
@@ -19,7 +20,20 @@ module SpeechToText
     def self.create_job(audio, server_url, jobdetails_json)
       request = "curl -F \"file=@#{audio}\" \"#{server_url}/deepspeech/createjob\" > #{jobdetails_json}"
-      system(request)
+      Open3.popen2e(request) do |stdin, stdout_err, wait_thr|
+        while line = stdout_err.gets
+          puts "#{line}"
+        end
+        exit_status = wait_thr.value
+        unless exit_status.success?
+          puts '---------------------'
+          puts "FAILED to execute --> #{request}"
+          puts '---------------------'
+        end
+      end
       file = File.open(jobdetails_json, 'r')
       data = JSON.load file
       data['job_id']
@@ -42,7 +56,20 @@ module SpeechToText
     # used by deepspeech server only
     def self.generate_transcript(audio, json_file, model_path)
       deepspeech_command = "#{model_path}/deepspeech --model #{model_path}/models/output_graph.pbmm --alphabet #{model_path}/models/alphabet.txt --lm #{model_path}/models/lm.binary --trie #{model_path}/models/trie -e --audio #{audio} > #{json_file}"
-      system(deepspeech_command.to_s)
+      Open3.popen2e(deepspeech_command) do |stdin, stdout_err, wait_thr|
+        while line = stdout_err.gets
+          puts "#{line}"
+        end
+        exit_status = wait_thr.value
+        unless exit_status.success?
+          puts '---------------------'
+          puts "FAILED to execute --> #{deepspeech_command}"
+          puts '---------------------'
+        end
+      end
     end
     # rubocop:disable Metrics/MethodLength

data/lib/speech_to_text/google.rb CHANGED Viewed

@@ -70,18 +70,15 @@ module SpeechToText
       # construct a new operation object from the id
       speech = Google::Cloud::Speech.new(version: :v1p1beta1)
       operation2 = speech.get_operation operation_name
+      status = 'not found'
       if operation2.error?
         status = 'failed'
-        return status
-      end
-      if operation2.done?
+      elsif operation2.done?
         status = 'completed'
-        return status
+      else
+        status = 'inProgress'
       end
-      status = 'inProgress'
-      status
+      return status
     end
     def self.get_words(operation_name)

data/lib/speech_to_text/speechmatics.rb CHANGED Viewed

@@ -12,6 +12,7 @@ require_relative 'util.rb'
 require 'net/http'
 require 'uri'
 require 'json'
+require 'open3'
 module SpeechToText
   module SpeechmaticsS2T # rubocop:disable Style/Documentation
@@ -24,7 +25,20 @@ module SpeechToText
       # rubocop:enable Metrics/ParameterLists
       # rubocop:enable Naming/VariableName
       upload_audio = "curl -F data_file=@#{audio_file_path}/#{audio_name}.#{audio_content_type} -F model=#{model} \"https://api.speechmatics.com/v1.0/user/#{userID}/jobs/?auth_token=#{authKey}\" > #{jobID_json_file}"
-      system(upload_audio.to_s)
+      Open3.popen2e(upload_audio) do |stdin, stdout_err, wait_thr|
+        while line = stdout_err.gets
+          puts "#{line}"
+        end
+        exit_status = wait_thr.value
+        unless exit_status.success?
+          puts '---------------------'
+          puts "FAILED to execute --> #{upload_audio}"
+          puts '---------------------'
+        end
+      end
       file = File.open(jobID_json_file)
       data = JSON.load file
       jobID = data['id'] # rubocop:disable Naming/VariableName

data/lib/speech_to_text/util.rb CHANGED Viewed

@@ -8,6 +8,7 @@
 #
 # Copyright (c) 2019 BigBlueButton Inc. and by respective authors (see below).
 #
+require 'open3'
 module SpeechToText
   module Util # rubocop:disable Style/Documentation
@@ -122,21 +123,34 @@ module SpeechToText
                             audio_content_type:,
                             **duration)
       # rubocop:enable Metrics/ParameterLists
+      video_to_audio_command = ''
       if duration.empty?
         video_to_audio_command = "ffmpeg -y -i #{video_file_path}/#{video_name}.#{video_content_type} -ac 1 -ar 16000 #{audio_file_path}/#{audio_name}.#{audio_content_type}"
-        system(video_to_audio_command.to_s)
       elsif duration[:start_time].nil? && duration[:end_time] != nil
         video_to_audio_command = "ffmpeg -y -ss #{0.to_i} -i #{video_file_path}/#{video_name}.#{video_content_type} -t #{duration[:end_time]} -ac 1 -ar 16000 #{audio_file_path}/#{audio_name}.#{audio_content_type}"
-        system(video_to_audio_command.to_s)
       elsif duration[:end_time].nil? && duration[:start_time] != nil
         video_to_audio_command = "ffmpeg -y -ss #{duration[:start_time]} -i #{video_file_path}/#{video_name}.#{video_content_type} -ac 1 -ar 16000 #{audio_file_path}/#{audio_name}.#{audio_content_type}"
-        system(video_to_audio_command.to_s)
       else
-        video_to_audio_command = "ffmpeg -y -ss #{duration[:start_time]} -i #{video_file_path}/#{video_name}.#{video_content_type} -to #{duration[:end_time]} -ac 1 -ar 16000 #{audio_file_path}/#{audio_name}.#{audio_content_type}"
-        system(video_to_audio_command.to_s)
-      end
+        video_to_audio_command = "ffmpeg -y -t #{duration[:end_time]} -i #{video_file_path}/#{video_name}.#{video_content_type} -ss #{duration[:start_time]} -ac 1 -ar 16000 #{audio_file_path}/#{audio_name}.#{audio_content_type}"
+      end
+        Open3.popen2e(video_to_audio_command) do |stdin, stdout_err, wait_thr|
+          while line = stdout_err.gets
+            puts "#{line}"
+          end
+          exit_status = wait_thr.value
+          unless exit_status.success?
+            puts '---------------------'
+            puts "FAILED to execute --> #{video_to_audio_command}"
+            puts '---------------------'
+          end
+        end
+        #Open3.popen3(video_to_audio_command.to_s) do |stdin, stdout, stderr, wait_thr|
+        #  puts "stdout is:" + stdout.read
+        #  puts "stderr is:" + stderr.read
+        #end
     end
   end
 end

data/lib/speech_to_text/version.rb CHANGED Viewed

@@ -1,5 +1,5 @@
 # frozen_string_literal: true
 module SpeechToText
-  VERSION = '0.1.4'
+  VERSION = '0.1.5'
 end

metadata CHANGED Viewed

@@ -1,14 +1,14 @@
 --- !ruby/object:Gem::Specification
 name: speech_to_text
 version: !ruby/object:Gem::Version
-  version: 0.1.4
+  version: 0.1.5
 platform: ruby
 authors:
 - Richard Alam
 autorequire:
 bindir: exe
 cert_chain: []
-date: 2019-11-20 00:00:00.000000000 Z
+date: 2019-11-21 00:00:00.000000000 Z
 dependencies:
 - !ruby/object:Gem::Dependency
   name: bundler
@@ -94,7 +94,6 @@ files:
 - LICENSE.txt
 - README.md
 - Rakefile
-- abc.mp3
 - bin/console
 - bin/setup
 - examples/3playmedia.rb
@@ -113,7 +112,6 @@ files:
 - resources/test/test.json
 - resources/test/video/video.mp4
 - speech_to_text.gemspec
-- webcams.webm
 homepage: https://github.com/bigbluebutton/speech_to_text
 licenses:
 - MIT

data/abc.mp3 DELETED Viewed

Binary file

data/webcams.webm DELETED Viewed

Binary file