right_scraper 1.0.26 → 3.0.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- data/Gemfile +16 -0
- data/README.rdoc +9 -28
- data/Rakefile +51 -39
- data/lib/right_scraper/builders/base.rb +64 -0
- data/lib/right_scraper/builders/filesystem.rb +96 -0
- data/lib/right_scraper/builders/union.rb +57 -0
- data/lib/right_scraper/logger.rb +102 -0
- data/lib/right_scraper/loggers/noisy.rb +85 -0
- data/lib/right_scraper/processes/ssh.rb +188 -0
- data/lib/right_scraper/repositories/base.rb +299 -0
- data/lib/right_scraper/repositories/download.rb +90 -0
- data/lib/right_scraper/repositories/git.rb +92 -0
- data/lib/right_scraper/repositories/mock.rb +70 -0
- data/lib/right_scraper/repositories/svn.rb +96 -0
- data/lib/right_scraper/resources/base.rb +70 -0
- data/{spec/scraper_base_spec.rb → lib/right_scraper/resources/cookbook.rb} +9 -23
- data/lib/right_scraper/resources/workflow.rb +55 -0
- data/lib/right_scraper/retrievers/base.rb +114 -0
- data/lib/right_scraper/retrievers/checkout.rb +79 -0
- data/lib/right_scraper/retrievers/download.rb +97 -0
- data/lib/right_scraper/retrievers/git.rb +140 -0
- data/lib/right_scraper/retrievers/svn.rb +87 -0
- data/lib/right_scraper/scanners/base.rb +111 -0
- data/lib/right_scraper/scanners/cookbook_manifest.rb +59 -0
- data/lib/right_scraper/scanners/cookbook_metadata.rb +69 -0
- data/lib/right_scraper/scanners/cookbook_s3_upload.rb +84 -0
- data/lib/right_scraper/scanners/union.rb +89 -0
- data/lib/right_scraper/scanners/workflow_manifest.rb +86 -0
- data/lib/right_scraper/scanners/workflow_metadata.rb +70 -0
- data/lib/right_scraper/scanners/workflow_s3_upload.rb +85 -0
- data/lib/right_scraper/scraper.rb +81 -57
- data/lib/right_scraper/scraper_logger.rb +61 -0
- data/lib/right_scraper/scrapers/base.rb +262 -0
- data/lib/right_scraper/scrapers/cookbook.rb +73 -0
- data/lib/right_scraper/scrapers/workflow.rb +88 -0
- data/lib/right_scraper/svn_client.rb +101 -0
- data/lib/right_scraper/version.rb +28 -0
- data/lib/right_scraper.rb +35 -11
- data/right_scraper.gemspec +26 -13
- data/right_scraper.rconf +13 -0
- data/spec/builder_spec.rb +50 -0
- data/spec/cookbook_helper.rb +73 -0
- data/spec/cookbook_manifest_spec.rb +55 -0
- data/spec/cookbook_s3_upload_spec.rb +152 -0
- data/spec/download/download_retriever_spec.rb +118 -0
- data/spec/download/download_retriever_spec_helper.rb +72 -0
- data/spec/download/download_spec.rb +130 -0
- data/spec/download/multi_dir_spec.rb +106 -0
- data/spec/download/multi_dir_spec_helper.rb +40 -0
- data/spec/git/cookbook_spec.rb +166 -0
- data/spec/git/demokey +27 -0
- data/spec/git/demokey.pub +1 -0
- data/spec/git/password_key +30 -0
- data/spec/git/password_key.pub +1 -0
- data/spec/git/repository_spec.rb +110 -0
- data/spec/git/retriever_spec.rb +505 -0
- data/spec/git/retriever_spec_helper.rb +112 -0
- data/spec/git/scraper_spec.rb +136 -0
- data/spec/git/ssh_spec.rb +170 -0
- data/spec/git/url_spec.rb +103 -0
- data/spec/logger_spec.rb +185 -0
- data/spec/repository_spec.rb +89 -23
- data/spec/{scraper_spec_helper_base.rb → retriever_spec_helper.rb} +41 -27
- data/spec/scanner_spec.rb +61 -0
- data/spec/scraper_helper.rb +96 -0
- data/spec/scraper_spec.rb +123 -45
- data/spec/spec_helper.rb +87 -14
- data/spec/svn/cookbook_spec.rb +97 -0
- data/spec/svn/multi_svn_spec.rb +64 -0
- data/spec/svn/multi_svn_spec_helper.rb +40 -0
- data/spec/svn/repository_spec.rb +72 -0
- data/spec/svn/retriever_spec.rb +261 -0
- data/spec/svn/scraper_spec.rb +90 -0
- data/spec/svn/{svn_scraper_spec_helper.rb → svn_retriever_spec_helper.rb} +46 -27
- data/spec/svn/url_spec.rb +47 -0
- data/spec/url_spec.rb +164 -0
- metadata +203 -31
- data/lib/right_scraper/linux/process_monitor.rb +0 -84
- data/lib/right_scraper/repository.rb +0 -78
- data/lib/right_scraper/scraper_base.rb +0 -175
- data/lib/right_scraper/scrapers/download_scraper.rb +0 -67
- data/lib/right_scraper/scrapers/git_scraper.rb +0 -283
- data/lib/right_scraper/scrapers/svn_scraper.rb +0 -119
- data/lib/right_scraper/watcher.rb +0 -158
- data/lib/right_scraper/win32/process_monitor.rb +0 -98
- data/spec/download/download_scraper_spec.rb +0 -94
- data/spec/git/git_scraper_spec.rb +0 -165
- data/spec/git/git_scraper_spec_helper.rb +0 -72
- data/spec/rcov.opts +0 -1
- data/spec/spec.opts +0 -2
- data/spec/svn/svn_scraper_spec.rb +0 -148
- data/spec/watcher_spec.rb +0 -74
|
@@ -1,119 +0,0 @@
|
|
|
1
|
-
#--
|
|
2
|
-
# Copyright: Copyright (c) 2010 RightScale, Inc.
|
|
3
|
-
#
|
|
4
|
-
# Permission is hereby granted, free of charge, to any person obtaining
|
|
5
|
-
# a copy of this software and associated documentation files (the
|
|
6
|
-
# 'Software'), to deal in the Software without restriction, including
|
|
7
|
-
# without limitation the rights to use, copy, modify, merge, publish,
|
|
8
|
-
# distribute, sublicense, and/or sell copies of the Software, and to
|
|
9
|
-
# permit persons to whom the Software is furnished to do so, subject to
|
|
10
|
-
# the following conditions:
|
|
11
|
-
#
|
|
12
|
-
# The above copyright notice and this permission notice shall be
|
|
13
|
-
# included in all copies or substantial portions of the Software.
|
|
14
|
-
#
|
|
15
|
-
# THE SOFTWARE IS PROVIDED 'AS IS', WITHOUT WARRANTY OF ANY KIND,
|
|
16
|
-
# EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
|
|
17
|
-
# MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.
|
|
18
|
-
# IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY
|
|
19
|
-
# CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
|
|
20
|
-
# TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
|
|
21
|
-
# SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
|
|
22
|
-
#++
|
|
23
|
-
|
|
24
|
-
module RightScale
|
|
25
|
-
|
|
26
|
-
class SvnScraper < ScraperBase
|
|
27
|
-
|
|
28
|
-
# Check whether it is possible to perform an incremental update of the repo
|
|
29
|
-
#
|
|
30
|
-
# === Return
|
|
31
|
-
# true:: Scrape directory contains files belonging to the scraped repo and protocol supports
|
|
32
|
-
# incremental updates
|
|
33
|
-
# false:: Otherwise
|
|
34
|
-
def incremental_update?
|
|
35
|
-
return false unless File.directory?(@current_repo_dir)
|
|
36
|
-
inc = false
|
|
37
|
-
cookbooks_path = repo.cookbooks_path || []
|
|
38
|
-
cookbooks_path = [ cookbooks_path ] unless cookbooks_path.is_a?(Array)
|
|
39
|
-
if cookbooks_path.empty?
|
|
40
|
-
Dir.chdir(@current_repo_dir) do
|
|
41
|
-
info = run('svn', 'info')
|
|
42
|
-
inc = $?.success? && info =~ (/^URL: (.*)$/) && $1 == @repo.url
|
|
43
|
-
end
|
|
44
|
-
else
|
|
45
|
-
cookbooks_path.each do |path|
|
|
46
|
-
Dir.chdir(File.join(@current_repo_dir, path)) do
|
|
47
|
-
info = run('svn', 'info')
|
|
48
|
-
inc = $?.success? && info =~ (/^URL: (.*)$/) && $1 == File.join(@repo.url, path)
|
|
49
|
-
break unless inc
|
|
50
|
-
end
|
|
51
|
-
end
|
|
52
|
-
end
|
|
53
|
-
inc
|
|
54
|
-
end
|
|
55
|
-
|
|
56
|
-
# Scrape SVN repository, see RightScale::Scraper#scrape
|
|
57
|
-
#
|
|
58
|
-
# === Return
|
|
59
|
-
# true:: Always return true
|
|
60
|
-
def scrape_imp
|
|
61
|
-
msg = @incremental ? "Updating " : "Checking out "
|
|
62
|
-
msg += "SVN repository '#{@repo.display_name}'"
|
|
63
|
-
@callback.call(msg, is_step=true) if @callback
|
|
64
|
-
cookbooks_path = repo.cookbooks_path || []
|
|
65
|
-
cookbooks_path = [ cookbooks_path ] unless cookbooks_path.is_a?(Array)
|
|
66
|
-
if @incremental
|
|
67
|
-
args = ['update', '--no-auth-cache', '--non-interactive', '--quiet']
|
|
68
|
-
args += ['--revision', @repo.tag] if (!@repo.tag.nil? && !@repo.tag.empty?)
|
|
69
|
-
args += ['--username', @repo.first_credential] if @repo.first_credential
|
|
70
|
-
args += ['--password', @repo.second_credential] if @repo.second_credential
|
|
71
|
-
|
|
72
|
-
if cookbooks_path.empty?
|
|
73
|
-
Dir.chdir(@current_repo_dir) do
|
|
74
|
-
res = @watcher.launch_and_watch('svn', args, @current_repo_dir)
|
|
75
|
-
handle_watcher_result(res, 'SVN update')
|
|
76
|
-
end
|
|
77
|
-
else
|
|
78
|
-
cookbooks_path.each do |path|
|
|
79
|
-
break unless succeeded?
|
|
80
|
-
full_path = File.join(@current_repo_dir, path)
|
|
81
|
-
Dir.chdir(full_path) do
|
|
82
|
-
res = @watcher.launch_and_watch('svn', args, @current_repo_dir)
|
|
83
|
-
handle_watcher_result(res, 'SVN update')
|
|
84
|
-
end
|
|
85
|
-
end
|
|
86
|
-
end
|
|
87
|
-
end
|
|
88
|
-
if !@incremental && succeeded?
|
|
89
|
-
if cookbooks_path.empty?
|
|
90
|
-
res = @watcher.launch_and_watch('svn', svn_checkout_args, @current_repo_dir)
|
|
91
|
-
handle_watcher_result(res, 'SVN checkout')
|
|
92
|
-
else
|
|
93
|
-
cookbooks_path.each do |path|
|
|
94
|
-
break unless succeeded?
|
|
95
|
-
res = @watcher.launch_and_watch('svn', svn_checkout_args(path), @current_repo_dir)
|
|
96
|
-
handle_watcher_result(res, 'SVN checkout')
|
|
97
|
-
end
|
|
98
|
-
end
|
|
99
|
-
end
|
|
100
|
-
true
|
|
101
|
-
end
|
|
102
|
-
|
|
103
|
-
# SVN checkout command using current repo definition and given path into it
|
|
104
|
-
#
|
|
105
|
-
# === Parameters
|
|
106
|
-
# path(String):: Relative path inside repo that should be checked out
|
|
107
|
-
#
|
|
108
|
-
# === Return
|
|
109
|
-
# svn_cmd(String):: Corresponding SVN command line
|
|
110
|
-
def svn_checkout_args(path='')
|
|
111
|
-
args = ['checkout', File.join(@repo.url, path), File.join(@current_repo_dir, path),
|
|
112
|
-
'--no-auth-cache', '--non-interactive', '--quiet']
|
|
113
|
-
args += ['--revision', @repo.tag] if !@repo.tag.nil? && !@repo.tag.empty?
|
|
114
|
-
args += ['--username', @repo.first_credential] if @repo.first_credential
|
|
115
|
-
args += ['--password', @repo.second_credential] if @repo.second_credential
|
|
116
|
-
return args
|
|
117
|
-
end
|
|
118
|
-
end
|
|
119
|
-
end
|
|
@@ -1,158 +0,0 @@
|
|
|
1
|
-
#--
|
|
2
|
-
# Copyright: Copyright (c) 2010 RightScale, Inc.
|
|
3
|
-
#
|
|
4
|
-
# Permission is hereby granted, free of charge, to any person obtaining
|
|
5
|
-
# a copy of this software and associated documentation files (the
|
|
6
|
-
# 'Software'), to deal in the Software without restriction, including
|
|
7
|
-
# without limitation the rights to use, copy, modify, merge, publish,
|
|
8
|
-
# distribute, sublicense, and/or sell copies of the Software, and to
|
|
9
|
-
# permit persons to whom the Software is furnished to do so, subject to
|
|
10
|
-
# the following conditions:
|
|
11
|
-
#
|
|
12
|
-
# The above copyright notice and this permission notice shall be
|
|
13
|
-
# included in all copies or substantial portions of the Software.
|
|
14
|
-
#
|
|
15
|
-
# THE SOFTWARE IS PROVIDED 'AS IS', WITHOUT WARRANTY OF ANY KIND,
|
|
16
|
-
# EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
|
|
17
|
-
# MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.
|
|
18
|
-
# IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY
|
|
19
|
-
# CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
|
|
20
|
-
# TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
|
|
21
|
-
# SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
|
|
22
|
-
#++
|
|
23
|
-
|
|
24
|
-
require 'find'
|
|
25
|
-
if RUBY_PLATFORM =~ /mswin/
|
|
26
|
-
require File.join(File.dirname(__FILE__), 'win32', 'process_monitor')
|
|
27
|
-
else
|
|
28
|
-
require File.join(File.dirname(__FILE__), 'linux', 'process_monitor')
|
|
29
|
-
end
|
|
30
|
-
|
|
31
|
-
module RightScale
|
|
32
|
-
|
|
33
|
-
# Encapsulate information returned by watcher
|
|
34
|
-
class WatchStatus
|
|
35
|
-
|
|
36
|
-
# Potential outcome of watcher
|
|
37
|
-
VALID_STATUSES = [ :success, :timeout, :size_exceeded ]
|
|
38
|
-
|
|
39
|
-
attr_reader :status # One of VALID_STATUSES
|
|
40
|
-
attr_reader :exit_code # Watched process exit code or -1 if process was killed
|
|
41
|
-
attr_reader :output # Watched process combined output
|
|
42
|
-
|
|
43
|
-
# Initialize attibutes
|
|
44
|
-
def initialize(status, exit_code, output)
|
|
45
|
-
@status = status
|
|
46
|
-
@exit_code = exit_code
|
|
47
|
-
@output = output
|
|
48
|
-
end
|
|
49
|
-
|
|
50
|
-
end
|
|
51
|
-
|
|
52
|
-
class Watcher
|
|
53
|
-
|
|
54
|
-
attr_reader :max_bytes # Maximum size in bytes of watched directory before process is killed
|
|
55
|
-
attr_reader :max_seconds # Maximum number of elapased seconds before external process is killed
|
|
56
|
-
|
|
57
|
-
# Initialize attributes
|
|
58
|
-
#
|
|
59
|
-
# max_bytes(Integer):: Maximum size in bytes of watched directory before process is killed
|
|
60
|
-
# max_seconds(Integer):: Maximum number of elapased seconds before external process is killed
|
|
61
|
-
def initialize(max_bytes, max_seconds)
|
|
62
|
-
@max_bytes = max_bytes
|
|
63
|
-
@max_seconds = max_seconds
|
|
64
|
-
end
|
|
65
|
-
|
|
66
|
-
# Launch given command as external process and watch given directory
|
|
67
|
-
# so it doesn't exceed given size. Also watch time elapsed and kill
|
|
68
|
-
# external process if either the size of the watched directory exceed
|
|
69
|
-
# @max_bytes or the time elapsed exceeds @max_seconds.
|
|
70
|
-
# Note: This method is not thread-safe, instantiate one watcher per thread
|
|
71
|
-
#
|
|
72
|
-
# === Parameters
|
|
73
|
-
# cmd(String):: Command line to be launched
|
|
74
|
-
# dest_dir(String):: Watched directory
|
|
75
|
-
#
|
|
76
|
-
# === Return
|
|
77
|
-
# res(RightScale::WatchStatus):: Outcome of watch, see RightScale::WatchStatus
|
|
78
|
-
def launch_and_watch(cmd, args, dest_dir)
|
|
79
|
-
exit_code = nil
|
|
80
|
-
output = ''
|
|
81
|
-
monitor = ProcessMonitor.new
|
|
82
|
-
|
|
83
|
-
# Run external process and monitor it in a new thread, platform specific
|
|
84
|
-
pid = monitor.spawn(cmd, *args) do |data|
|
|
85
|
-
output << data[:output] if data[:output]
|
|
86
|
-
exit_code = data[:exit_code] if data.include?(:exit_code)
|
|
87
|
-
end
|
|
88
|
-
|
|
89
|
-
# Loop until process is done or times out or takes too much space
|
|
90
|
-
timed_out = repeat(1, @max_seconds) do
|
|
91
|
-
if @max_bytes < 0
|
|
92
|
-
exit_code
|
|
93
|
-
else
|
|
94
|
-
size = 0
|
|
95
|
-
Find.find(dest_dir) { |f| size += File.stat(f).size rescue 0 if File.file?(f) } if File.directory?(dest_dir)
|
|
96
|
-
size > @max_bytes || exit_code
|
|
97
|
-
end
|
|
98
|
-
end
|
|
99
|
-
|
|
100
|
-
# Cleanup and report status
|
|
101
|
-
# Note: We need to store the exit status before we kill the underlying process so that
|
|
102
|
-
# if it finished in the mean time we still report -1 as exit code
|
|
103
|
-
if exit_code
|
|
104
|
-
exit_status = exit_code
|
|
105
|
-
outcome = :success
|
|
106
|
-
else
|
|
107
|
-
exit_status = -1
|
|
108
|
-
outcome = (timed_out ? :timeout : :size_exceeded)
|
|
109
|
-
Process.kill('INT', pid)
|
|
110
|
-
end
|
|
111
|
-
|
|
112
|
-
# Cleanup any open handle etc., platform specific
|
|
113
|
-
monitor.cleanup
|
|
114
|
-
|
|
115
|
-
res = WatchStatus.new(outcome, exit_status, output)
|
|
116
|
-
end
|
|
117
|
-
|
|
118
|
-
protected
|
|
119
|
-
|
|
120
|
-
# Run given block in thread and time execution
|
|
121
|
-
#
|
|
122
|
-
# === Block
|
|
123
|
-
# Block whose execution is timed
|
|
124
|
-
#
|
|
125
|
-
# === Return
|
|
126
|
-
# elapsed(Integer):: Number of seconds elapsed while running given block
|
|
127
|
-
def timed
|
|
128
|
-
start_at = Time.now
|
|
129
|
-
yield
|
|
130
|
-
elapsed = Time.now - start_at
|
|
131
|
-
end
|
|
132
|
-
|
|
133
|
-
# Repeat given block at regular intervals
|
|
134
|
-
#
|
|
135
|
-
# === Parameters
|
|
136
|
-
# seconds(Integer):: Number of seconds between executions
|
|
137
|
-
# timeout(Integer):: Timeout after which execution stops and method returns
|
|
138
|
-
#
|
|
139
|
-
# === Block
|
|
140
|
-
# Given block gets executed every period seconds until timeout is reached
|
|
141
|
-
# *or* block returns true
|
|
142
|
-
#
|
|
143
|
-
# === Return
|
|
144
|
-
# res(TrueClass|FalseClass):: true if timeout is reached, false otherwise.
|
|
145
|
-
def repeat(period, timeout)
|
|
146
|
-
end_at = Time.now + timeout
|
|
147
|
-
while res = (timeout < 0 || Time.now < end_at)
|
|
148
|
-
exit = false
|
|
149
|
-
elapsed = timed { exit = yield }
|
|
150
|
-
break if exit
|
|
151
|
-
sleep(period - elapsed) if elapsed < period
|
|
152
|
-
end
|
|
153
|
-
!res
|
|
154
|
-
end
|
|
155
|
-
|
|
156
|
-
end
|
|
157
|
-
|
|
158
|
-
end
|
|
@@ -1,98 +0,0 @@
|
|
|
1
|
-
#--
|
|
2
|
-
# Copyright: Copyright (c) 2010 RightScale, Inc.
|
|
3
|
-
#
|
|
4
|
-
# Permission is hereby granted, free of charge, to any person obtaining
|
|
5
|
-
# a copy of this software and associated documentation files (the
|
|
6
|
-
# 'Software'), to deal in the Software without restriction, including
|
|
7
|
-
# without limitation the rights to use, copy, modify, merge, publish,
|
|
8
|
-
# distribute, sublicense, and/or sell copies of the Software, and to
|
|
9
|
-
# permit persons to whom the Software is furnished to do so, subject to
|
|
10
|
-
# the following conditions:
|
|
11
|
-
#
|
|
12
|
-
# The above copyright notice and this permission notice shall be
|
|
13
|
-
# included in all copies or substantial portions of the Software.
|
|
14
|
-
#
|
|
15
|
-
# THE SOFTWARE IS PROVIDED 'AS IS', WITHOUT WARRANTY OF ANY KIND,
|
|
16
|
-
# EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
|
|
17
|
-
# MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.
|
|
18
|
-
# IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY
|
|
19
|
-
# CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
|
|
20
|
-
# TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
|
|
21
|
-
# SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
|
|
22
|
-
#++
|
|
23
|
-
|
|
24
|
-
require 'win32/process'
|
|
25
|
-
|
|
26
|
-
module RightScale
|
|
27
|
-
|
|
28
|
-
# Windows specific watcher implementation
|
|
29
|
-
class ProcessMonitor
|
|
30
|
-
|
|
31
|
-
include ::Windows::Process
|
|
32
|
-
include ::Windows::Synchronize
|
|
33
|
-
include ::Windows::Handle
|
|
34
|
-
|
|
35
|
-
# Spawn given process and callback given block with output and exit code
|
|
36
|
-
#
|
|
37
|
-
# === Parameters
|
|
38
|
-
# cmd(String):: Name of the command to run
|
|
39
|
-
# arg1(String):: Optional, first command-line argumument
|
|
40
|
-
# arg2(String):: Optional, first command-line argumument
|
|
41
|
-
# ...
|
|
42
|
-
# argN(String):: Optional, Nth command-line argumument
|
|
43
|
-
#
|
|
44
|
-
# === Block
|
|
45
|
-
# Given block should take one argument which is a hash which may contain
|
|
46
|
-
# the keys :output and :exit_code. The value associated with :output is a chunk
|
|
47
|
-
# of output while the value associated with :exit_code is the process exit code
|
|
48
|
-
# This block won't be called anymore once the :exit_code key has associated value
|
|
49
|
-
#
|
|
50
|
-
# === Return
|
|
51
|
-
# pid(Integer):: Spawned process pid
|
|
52
|
-
def spawn(cmd, *args)
|
|
53
|
-
args = args.map { |a| a.to_s }
|
|
54
|
-
cmd = ([cmd] + args).join(' ')
|
|
55
|
-
|
|
56
|
-
# Run external process and monitor it in a new thread
|
|
57
|
-
@io = IO.popen(cmd)
|
|
58
|
-
@handle = OpenProcess(PROCESS_ALL_ACCESS, 0, @io.pid)
|
|
59
|
-
case @handle
|
|
60
|
-
when INVALID_HANDLE_VALUE
|
|
61
|
-
# Something bad happened
|
|
62
|
-
yield(:exit_code => 1)
|
|
63
|
-
when 0
|
|
64
|
-
# Process already finished
|
|
65
|
-
yield(:exit_code => 0)
|
|
66
|
-
else
|
|
67
|
-
# Start output read
|
|
68
|
-
@reader = Thread.new do
|
|
69
|
-
o = @io.read
|
|
70
|
-
until o == ''
|
|
71
|
-
yield(:output => o)
|
|
72
|
-
o = @io.read
|
|
73
|
-
end
|
|
74
|
-
status = WaitForSingleObject(@handle, INFINITE)
|
|
75
|
-
exit_code = [0].pack('L')
|
|
76
|
-
if GetExitCodeProcess(@handle, exit_code)
|
|
77
|
-
exit_code = exit_code.unpack('L').first
|
|
78
|
-
else
|
|
79
|
-
exit_code = 1
|
|
80
|
-
end
|
|
81
|
-
yield(:exit_code => exit_code)
|
|
82
|
-
end
|
|
83
|
-
end
|
|
84
|
-
@io.pid
|
|
85
|
-
end
|
|
86
|
-
|
|
87
|
-
# Cleanup underlying handle
|
|
88
|
-
#
|
|
89
|
-
# === Return
|
|
90
|
-
# true:: Always return true
|
|
91
|
-
def cleanup
|
|
92
|
-
@reader.join
|
|
93
|
-
CloseHandle(@handle) if @handle > 0
|
|
94
|
-
@io.close
|
|
95
|
-
end
|
|
96
|
-
|
|
97
|
-
end
|
|
98
|
-
end
|
|
@@ -1,94 +0,0 @@
|
|
|
1
|
-
#--
|
|
2
|
-
# Copyright: Copyright (c) 2010 RightScale, Inc.
|
|
3
|
-
#
|
|
4
|
-
# Permission is hereby granted, free of charge, to any person obtaining
|
|
5
|
-
# a copy of this software and associated documentation files (the
|
|
6
|
-
# 'Software'), to deal in the Software without restriction, including
|
|
7
|
-
# without limitation the rights to use, copy, modify, merge, publish,
|
|
8
|
-
# distribute, sublicense, and/or sell copies of the Software, and to
|
|
9
|
-
# permit persons to whom the Software is furnished to do so, subject to
|
|
10
|
-
# the following conditions:
|
|
11
|
-
#
|
|
12
|
-
# The above copyright notice and this permission notice shall be
|
|
13
|
-
# included in all copies or substantial portions of the Software.
|
|
14
|
-
#
|
|
15
|
-
# THE SOFTWARE IS PROVIDED 'AS IS', WITHOUT WARRANTY OF ANY KIND,
|
|
16
|
-
# EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
|
|
17
|
-
# MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.
|
|
18
|
-
# IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY
|
|
19
|
-
# CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
|
|
20
|
-
# TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
|
|
21
|
-
# SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
|
|
22
|
-
#++
|
|
23
|
-
|
|
24
|
-
# Not supported on Windows
|
|
25
|
-
unless RUBY_PLATFORM=~/mswin/
|
|
26
|
-
|
|
27
|
-
require File.expand_path(File.join(File.dirname(__FILE__), '..', 'spec_helper'))
|
|
28
|
-
require 'scraper_base'
|
|
29
|
-
require 'repository'
|
|
30
|
-
require 'watcher'
|
|
31
|
-
require File.join('scrapers', 'download_scraper')
|
|
32
|
-
|
|
33
|
-
describe RightScale::DownloadScraper do
|
|
34
|
-
|
|
35
|
-
include RightScale::SpecHelpers
|
|
36
|
-
|
|
37
|
-
# Create download repository following given layout
|
|
38
|
-
# Update @repo_path with path to repository
|
|
39
|
-
# Delete any previously created repo
|
|
40
|
-
def setup_download_repo
|
|
41
|
-
@download_repo_path = File.expand_path(File.join(File.dirname(__FILE__), '__download_repo'))
|
|
42
|
-
@repo_path = File.join(File.dirname(__FILE__), '__repo')
|
|
43
|
-
@repo_content = [ { 'folder1' => [ 'file2', 'file3' ] }, { 'folder2' => [ { 'folder3' => [ 'file4' ] } ] }, 'file1' ]
|
|
44
|
-
FileUtils.rm_rf(@download_repo_path)
|
|
45
|
-
create_file_layout(@download_repo_path, @repo_content)
|
|
46
|
-
@download_file = File.expand_path(File.join(File.dirname(__FILE__), '__download_file.tar'))
|
|
47
|
-
Dir.chdir(@download_repo_path) do
|
|
48
|
-
res, status = exec("tar cf \"#{@download_file}\" *")
|
|
49
|
-
raise "Failed to create tarball: #{res}" unless status.success?
|
|
50
|
-
end
|
|
51
|
-
end
|
|
52
|
-
|
|
53
|
-
# Cleanup after ourselves
|
|
54
|
-
def delete_download_repo
|
|
55
|
-
FileUtils.rm_rf(@download_repo_path) if @download_repo_path
|
|
56
|
-
@download_repo_path = nil
|
|
57
|
-
FileUtils.rm_rf(@repo_path) if @repo_path
|
|
58
|
-
@repo_path = nil
|
|
59
|
-
File.delete(@download_file) if File.exist?(@download_file)
|
|
60
|
-
end
|
|
61
|
-
|
|
62
|
-
context 'given a download repository' do
|
|
63
|
-
|
|
64
|
-
before(:all) do
|
|
65
|
-
setup_download_repo
|
|
66
|
-
end
|
|
67
|
-
|
|
68
|
-
before(:each) do
|
|
69
|
-
@scraper = RightScale::DownloadScraper.new(@repo_path, max_bytes=1024**2, max_seconds=20)
|
|
70
|
-
@repo = RightScale::Repository.from_hash(:display_name => 'test repo',
|
|
71
|
-
:repo_type => :download,
|
|
72
|
-
:url => "file:///#{@download_file}")
|
|
73
|
-
FileUtils.rm_rf(RightScale::ScraperBase.repo_dir(@repo_path, @repo))
|
|
74
|
-
end
|
|
75
|
-
|
|
76
|
-
after(:all) do
|
|
77
|
-
delete_download_repo
|
|
78
|
-
end
|
|
79
|
-
|
|
80
|
-
it 'should scrape' do
|
|
81
|
-
messages = []
|
|
82
|
-
@scraper.scrape(@repo) { |m, progress| messages << m if progress }
|
|
83
|
-
puts "\n **ERRORS: #{@scraper.errors.join("\n")}\n" unless @scraper.succeeded?
|
|
84
|
-
@scraper.succeeded?.should be_true
|
|
85
|
-
messages.size.should == 1
|
|
86
|
-
File.directory?(@scraper.current_repo_dir).should be_true
|
|
87
|
-
extract_file_layout(@scraper.current_repo_dir).should == @repo_content
|
|
88
|
-
end
|
|
89
|
-
|
|
90
|
-
end
|
|
91
|
-
|
|
92
|
-
end
|
|
93
|
-
|
|
94
|
-
end # unless RUBY_PLATFORM=~/mswin/
|
|
@@ -1,165 +0,0 @@
|
|
|
1
|
-
#--
|
|
2
|
-
# Copyright: Copyright (c) 2010 RightScale, Inc.
|
|
3
|
-
#
|
|
4
|
-
# Permission is hereby granted, free of charge, to any person obtaining
|
|
5
|
-
# a copy of this software and associated documentation files (the
|
|
6
|
-
# 'Software'), to deal in the Software without restriction, including
|
|
7
|
-
# without limitation the rights to use, copy, modify, merge, publish,
|
|
8
|
-
# distribute, sublicense, and/or sell copies of the Software, and to
|
|
9
|
-
# permit persons to whom the Software is furnished to do so, subject to
|
|
10
|
-
# the following conditions:
|
|
11
|
-
#
|
|
12
|
-
# The above copyright notice and this permission notice shall be
|
|
13
|
-
# included in all copies or substantial portions of the Software.
|
|
14
|
-
#
|
|
15
|
-
# THE SOFTWARE IS PROVIDED 'AS IS', WITHOUT WARRANTY OF ANY KIND,
|
|
16
|
-
# EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
|
|
17
|
-
# MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.
|
|
18
|
-
# IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY
|
|
19
|
-
# CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
|
|
20
|
-
# TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
|
|
21
|
-
# SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
|
|
22
|
-
#++
|
|
23
|
-
|
|
24
|
-
require File.expand_path(File.join(File.dirname(__FILE__), 'git_scraper_spec_helper'))
|
|
25
|
-
require 'scraper_base'
|
|
26
|
-
require 'repository'
|
|
27
|
-
require 'watcher'
|
|
28
|
-
require File.join('scrapers', 'git_scraper')
|
|
29
|
-
require 'set'
|
|
30
|
-
|
|
31
|
-
describe RightScale::GitScraper do
|
|
32
|
-
|
|
33
|
-
context 'given a git repository' do
|
|
34
|
-
|
|
35
|
-
before(:each) do
|
|
36
|
-
@helper = RightScale::GitScraperSpecHelper.new
|
|
37
|
-
@helper.setup_test_repo
|
|
38
|
-
@scrape_dir = File.expand_path(File.join(File.dirname(__FILE__), '__scrape'))
|
|
39
|
-
@scraper = RightScale::GitScraper.new(@scrape_dir, max_bytes=1024**2, max_seconds=20)
|
|
40
|
-
@repo = RightScale::Repository.from_hash(:display_name => 'test repo',
|
|
41
|
-
:repo_type => :git,
|
|
42
|
-
:url => @helper.repo_path)
|
|
43
|
-
@current_repo_dir = RightScale::ScraperBase.repo_dir(@scrape_dir, @repo)
|
|
44
|
-
FileUtils.rm_rf(@current_repo_dir)
|
|
45
|
-
end
|
|
46
|
-
|
|
47
|
-
after(:each) do
|
|
48
|
-
@helper.delete_test_repo
|
|
49
|
-
FileUtils.rm_rf(@scrape_dir)
|
|
50
|
-
end
|
|
51
|
-
|
|
52
|
-
it 'should scrape the master branch' do
|
|
53
|
-
messages = []
|
|
54
|
-
@scraper.instance_variable_set(:@current_repo_dir, @current_repo_dir)
|
|
55
|
-
@scraper.incremental_update?.should be_false
|
|
56
|
-
@scraper.scrape(@repo) { |m, progress| messages << m if progress }
|
|
57
|
-
puts "\n **ERRORS: #{@scraper.errors.join("\n")}\n" unless @scraper.succeeded?
|
|
58
|
-
@scraper.succeeded?.should be_true
|
|
59
|
-
messages.size.should == 1
|
|
60
|
-
File.directory?(@scraper.current_repo_dir).should be_true
|
|
61
|
-
Set.new(@helper.extract_file_layout(@scraper.current_repo_dir, [ '.git', '.ssh' ])).should ==
|
|
62
|
-
Set.new(@helper.repo_content)
|
|
63
|
-
end
|
|
64
|
-
|
|
65
|
-
it 'should scrape the master branch incrementally' do
|
|
66
|
-
@scraper.scrape(@repo)
|
|
67
|
-
puts "\n **ERRORS: #{@scraper.errors.join("\n")}\n" unless @scraper.succeeded?
|
|
68
|
-
@scraper.incremental_update?.should be_true
|
|
69
|
-
@helper.create_file_layout(@helper.repo_path, @helper.additional_content)
|
|
70
|
-
@helper.commit_content
|
|
71
|
-
messages = []
|
|
72
|
-
@scraper.scrape(@repo) { |m, progress| messages << m if progress }
|
|
73
|
-
puts "\n **ERRORS: #{@scraper.errors.join("\n")}\n" unless @scraper.succeeded?
|
|
74
|
-
@scraper.succeeded?.should be_true
|
|
75
|
-
messages.size.should == 1
|
|
76
|
-
@scraper.instance_variable_get(:@incremental).should == true
|
|
77
|
-
File.directory?(@scraper.current_repo_dir).should be_true
|
|
78
|
-
Set.new(@helper.extract_file_layout(@scraper.current_repo_dir, [ '.git', '.ssh' ])).should ==
|
|
79
|
-
Set.new(@helper.repo_content + @helper.additional_content)
|
|
80
|
-
end
|
|
81
|
-
|
|
82
|
-
context 'and a branch' do
|
|
83
|
-
|
|
84
|
-
before(:each) do
|
|
85
|
-
@helper.setup_branch('test_branch', @helper.branch_content)
|
|
86
|
-
@branch_repo = RightScale::Repository.from_hash(:display_name => 'test repo',
|
|
87
|
-
:repo_type => :git,
|
|
88
|
-
:url => @helper.repo_path,
|
|
89
|
-
:tag => 'test_branch')
|
|
90
|
-
end
|
|
91
|
-
|
|
92
|
-
it 'should scrape a branch' do
|
|
93
|
-
messages = []
|
|
94
|
-
@scraper.scrape(@branch_repo) { |m, progress| messages << m if progress }
|
|
95
|
-
puts "\n **ERRORS: #{@scraper.errors.join("\n")}\n" unless @scraper.succeeded?
|
|
96
|
-
@scraper.succeeded?.should be_true
|
|
97
|
-
messages.size.should == 1
|
|
98
|
-
File.directory?(@scraper.current_repo_dir).should be_true
|
|
99
|
-
Set.new(@helper.extract_file_layout(@scraper.current_repo_dir, [ '.git', '.ssh' ])).should ==
|
|
100
|
-
Set.new((@helper.repo_content + @helper.branch_content))
|
|
101
|
-
end
|
|
102
|
-
|
|
103
|
-
it 'should scrape a branch incrementally' do
|
|
104
|
-
@scraper.scrape(@branch_repo)
|
|
105
|
-
puts "\n **ERRORS: #{@scraper.errors.join("\n")}\n" unless @scraper.succeeded?
|
|
106
|
-
@scraper.incremental_update?.should be_true
|
|
107
|
-
@helper.create_file_layout(@helper.repo_path, @helper.additional_content)
|
|
108
|
-
@helper.commit_content
|
|
109
|
-
messages = []
|
|
110
|
-
@scraper.scrape(@branch_repo) { |m, progress| messages << m if progress }
|
|
111
|
-
puts "\n **ERRORS: #{@scraper.errors.join("\n")}\n" unless @scraper.succeeded?
|
|
112
|
-
@scraper.succeeded?.should be_true
|
|
113
|
-
messages.size.should == 1
|
|
114
|
-
@scraper.instance_variable_get(:@incremental).should == true
|
|
115
|
-
File.directory?(@scraper.current_repo_dir).should be_true
|
|
116
|
-
Set.new(@helper.extract_file_layout(@scraper.current_repo_dir, [ '.git', '.ssh' ])).should ==
|
|
117
|
-
Set.new((@helper.repo_content + @helper.branch_content + @helper.additional_content))
|
|
118
|
-
end
|
|
119
|
-
|
|
120
|
-
end
|
|
121
|
-
|
|
122
|
-
context 'and a sha ref' do
|
|
123
|
-
|
|
124
|
-
before(:each) do
|
|
125
|
-
@helper.create_file_layout(@helper.repo_path, @helper.branch_content)
|
|
126
|
-
@helper.commit_content
|
|
127
|
-
@sha_repo = RightScale::Repository.from_hash(:display_name => 'test repo',
|
|
128
|
-
:repo_type => :git,
|
|
129
|
-
:url => @helper.repo_path,
|
|
130
|
-
:tag => @helper.commit_id(1))
|
|
131
|
-
end
|
|
132
|
-
|
|
133
|
-
it 'should scrape a sha' do
|
|
134
|
-
messages = []
|
|
135
|
-
@scraper.scrape(@sha_repo) { |m, progress| messages << m if progress }
|
|
136
|
-
puts "\n **ERRORS: #{@scraper.errors.join("\n")}\n" unless @scraper.succeeded?
|
|
137
|
-
@scraper.succeeded?.should be_true
|
|
138
|
-
messages.size.should == 1
|
|
139
|
-
File.directory?(@scraper.current_repo_dir).should be_true
|
|
140
|
-
Set.new(@helper.extract_file_layout(@scraper.current_repo_dir, [ '.git', '.ssh' ])).should ==
|
|
141
|
-
Set.new(@helper.repo_content)
|
|
142
|
-
end
|
|
143
|
-
|
|
144
|
-
it 'should scrape a sha incrementally' do
|
|
145
|
-
@scraper.scrape(@sha_repo)
|
|
146
|
-
puts "\n **ERRORS: #{@scraper.errors.join("\n")}\n" unless @scraper.succeeded?
|
|
147
|
-
@scraper.incremental_update?.should be_true
|
|
148
|
-
@helper.create_file_layout(@helper.repo_path, @helper.additional_content)
|
|
149
|
-
@helper.commit_content
|
|
150
|
-
messages = []
|
|
151
|
-
@scraper.scrape(@sha_repo) { |m, progress| messages << m if progress }
|
|
152
|
-
puts "\n **ERRORS: #{@scraper.errors.join("\n")}\n" unless @scraper.succeeded?
|
|
153
|
-
@scraper.succeeded?.should be_true
|
|
154
|
-
messages.size.should == 1
|
|
155
|
-
@scraper.instance_variable_get(:@incremental).should == true
|
|
156
|
-
File.directory?(@scraper.current_repo_dir).should be_true
|
|
157
|
-
Set.new(@helper.extract_file_layout(@scraper.current_repo_dir, [ '.git', '.ssh' ])).should ==
|
|
158
|
-
Set.new(@helper.repo_content)
|
|
159
|
-
end
|
|
160
|
-
|
|
161
|
-
end
|
|
162
|
-
|
|
163
|
-
end
|
|
164
|
-
|
|
165
|
-
end
|