miniharvest 0.1.2

Sign up to get free protection for your applications and to get access to all the features.
checksums.yaml ADDED
@@ -0,0 +1,7 @@
1
+ ---
2
+ SHA1:
3
+ metadata.gz: d04109b8822d0c99fdd143556813f4a63ff19c65
4
+ data.tar.gz: e51da2311599aea645c6906c7b6e6126831e7ef9
5
+ SHA512:
6
+ metadata.gz: c6f79fed856d7d6a36e53b52388a37e86d42f6b659c94a816b76be2f6b391f4469875baea00b8c45223a388c7c0798ac8c1078307f13f0ea9881700ac5375044
7
+ data.tar.gz: 620db7df75dbf7e3b9e50ddd37cef6c008d762a975f795e6ac6fc30406fef4b9d05eeeea4f4c8057aa270fabe15d2a1d0e95e971a350de6c9f3b31b246c4d390
data/.gitignore ADDED
@@ -0,0 +1,9 @@
1
+ /.bundle/
2
+ /.yardoc
3
+ /Gemfile.lock
4
+ /_yardoc/
5
+ /coverage/
6
+ /doc/
7
+ /pkg/
8
+ /spec/reports/
9
+ /tmp/
data/.travis.yml ADDED
@@ -0,0 +1,5 @@
1
+ sudo: false
2
+ language: ruby
3
+ rvm:
4
+ - 2.3.1
5
+ before_install: gem install bundler -v 1.12.5
data/Gemfile ADDED
@@ -0,0 +1,4 @@
1
# Gems are resolved from the public RubyGems index.
source "https://rubygems.org"

# The dependency list itself lives in miniharvest.gemspec.
gemspec
data/LICENSE.txt ADDED
@@ -0,0 +1,21 @@
1
+ The MIT License (MIT)
2
+
3
+ Copyright (c) 2016 Jamie Little
4
+
5
+ Permission is hereby granted, free of charge, to any person obtaining a copy
6
+ of this software and associated documentation files (the "Software"), to deal
7
+ in the Software without restriction, including without limitation the rights
8
+ to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
9
+ copies of the Software, and to permit persons to whom the Software is
10
+ furnished to do so, subject to the following conditions:
11
+
12
+ The above copyright notice and this permission notice shall be included in
13
+ all copies or substantial portions of the Software.
14
+
15
+ THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16
+ IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17
+ FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
18
+ AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19
+ LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
20
+ OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
21
+ THE SOFTWARE.
data/README.md ADDED
@@ -0,0 +1,32 @@
1
+ # MiniHarvest
2
+
3
+ MiniHarvest is used to harvest sets of MARCXML records from an OAI-PMH endpoint. The records are appended to a single MARCXML file that can be ingested with SolrMarc or used with other software.
4
+
5
+ ## Installation
6
+
7
+ Add this line to your application's Gemfile:
8
+
9
+ ```ruby
10
+ gem 'miniharvest'
11
+ ```
12
+
13
+ And then execute:
14
+
15
+ $ bundle
16
+
17
+ Or install it yourself as:
18
+
19
+ $ gem install miniharvest
20
+
21
+ ## Usage
22
+
23
+ On the command line:
24
+
25
+ ```bash
26
+ miniharvest http://oai-pmh/endpoint/ setname > marc.xml
27
+ ```
28
+
29
+ ## License
30
+
31
+ The gem is available as open source under the terms of the [MIT License](http://opensource.org/licenses/MIT).
32
+
data/Rakefile ADDED
@@ -0,0 +1,10 @@
1
require "bundler/gem_tasks"
require "rake/testtask"

# Defines the :test task: "test" and "lib" are appended to the task's libs
# list and every test/**/*_test.rb file is selected as a test file.
Rake::TestTask.new(:test) do |test_task|
  test_task.libs.push("test", "lib")
  test_task.test_files = FileList['test/**/*_test.rb']
end

# Running rake with no task name runs :test.
task default: :test
data/bin/console ADDED
@@ -0,0 +1,14 @@
1
#!/usr/bin/env ruby

# Opens an IRB session with the miniharvest gem already loaded.
require "bundler/setup"
require "miniharvest"

# Fixtures or other initialization code that makes experimenting with the
# gem easier can be added here.

# A different console can be used instead, e.g. Pry (it must then be added
# to the Gemfile):
# require "pry"
# Pry.start

require "irb"
IRB.start
data/bin/setup ADDED
@@ -0,0 +1,8 @@
1
#!/usr/bin/env bash
# Development bootstrap: installs the gem's dependencies with Bundler.

# Stop on a failing command, on use of an unset variable, and on a failure
# anywhere inside a pipeline.
set -o errexit -o nounset -o pipefail
# Split words on newlines and tabs only.
IFS=$'\n\t'
# Echo script lines as they are read and commands as they are executed.
set -o verbose -o xtrace

bundle install

# Do any other automated setup that you need to do here
data/exe/.DS_Store ADDED
Binary file
data/exe/miniharvest ADDED
@@ -0,0 +1,7 @@
1
#!/usr/bin/env ruby
# Command-line entry point.
#
# Usage: miniharvest OAI_BASE_URI SET > marc.xml
#
# Harvests the given set from the OAI-PMH endpoint and writes the combined
# MARCXML collection to standard output.
require 'miniharvest'

if ARGV.length < 2
  warn 'Usage: miniharvest OAI_BASE_URI SET'
  exit 1
end

mh = MiniHarvest::MiniHarvest.new
mh.oai_base_uri = ARGV[0]
mh.set = ARGV[1]

# initial_request follows every resumption token and prints the collection
# itself. Feeding its return value back into get_records (as this script used
# to do) triggered a second, token-less request and printed the collection
# twice, followed by a blank line.
mh.initial_request
data/exe/miniharvest~ ADDED
@@ -0,0 +1,6 @@
1
#!/usr/bin/env ruby
# NOTE(review): the trailing "~" in this file's name suggests it is an editor
# backup of exe/miniharvest that was packaged by accident -- confirm, and
# remove it from the repository if so.
#
# As shipped it could not run: the library was never required, and refute_nil
# is a Minitest assertion that does not exist in a plain script.
require 'miniharvest'

mh = MiniHarvest::MiniHarvest.new
mh.oai_base_uri = 'https://na03.alma.exlibrisgroup.com/view/oai/01UOML_INST/request'
mh.set = 'udvd'
# initial_request performs the whole harvest and prints the collection.
mh.initial_request
@@ -0,0 +1,3 @@
1
module MiniHarvest
  # Gem version string, read by miniharvest.gemspec. Frozen so the constant
  # cannot be mutated in place at runtime.
  VERSION = "0.1.2".freeze
end
@@ -0,0 +1,51 @@
1
+ require "miniharvest/version"
2
+
3
+ module MiniHarvest
4
+ require 'net/http'
5
+ require 'nokogiri'
6
+ require 'open-uri'
7
+
8
# Harvests records from an OAI-PMH endpoint and gathers them in a single
# MARCXML <collection> document.
#
# Typical use: assign +oai_base_uri+ and +set+, then call +initial_request+;
# the finished collection is written to standard output.
class MiniHarvest
  # XML namespace of the <collection> wrapper element.
  MARC_NAMESPACE = 'http://www.loc.gov/MARC21/slim'.freeze

  # oai_base_uri:: base URL of the OAI-PMH endpoint
  # set::          name of the OAI set to harvest
  attr_accessor :oai_base_uri, :set

  # Appends +records+ (the node set extracted by process_request) to this
  # harvester's collection element.
  def append_to_collection(records)
    marc_collection.root.add_child(records)
  end

  # Sends a GET request to +uri+ with +params+ encoded as the query string
  # and returns the Net::HTTP response object.
  def oai_request(uri, params)
    oai_uri = URI(uri)
    oai_uri.query = URI.encode_www_form(params)
    Net::HTTP.get_response(oai_uri)
  end

  # Parses the body of +res+ as XML, appends every <record> element to the
  # collection and returns the text of the response's <resumptionToken>.
  # The result is an empty string when the response carries no token, i.e.
  # when there are no further pages.
  def process_request(res)
    doc = Nokogiri::XML(res.body)
    # Namespaces are dropped so the plain XPath expressions below match.
    doc.remove_namespaces!
    append_to_collection(doc.xpath('//record'))

    # strip: whitespace around the token must not be mistaken for a token.
    doc.xpath('//resumptionToken').text.strip
  end

  # Starts a harvest: issues the first ListRecords request for +set+ (with
  # metadataPrefix marc21), then hands the returned resumption token to
  # get_records, which fetches the remaining pages and prints the result.
  # Returns nil.
  def initial_request
    params = { verb: 'ListRecords', set: set, metadataPrefix: 'marc21' }
    get_records(process_request(oai_request(oai_base_uri, params)))
  end

  # Fetches pages for as long as the endpoint keeps returning a resumption
  # token, then prints the accumulated collection to standard output.
  # Returns nil.
  #
  # An empty +token+ means the previous response was the last page: no
  # further request is made and the collection is printed straight away.
  # A nil +token+ means there is no harvest to resume; nothing is requested
  # or printed, so passing the (nil) result of initial_request is a no-op.
  def get_records(token)
    return if token.nil?

    # A loop rather than recursion, so the call stack does not grow by one
    # frame per page on large sets.
    until token.empty?
      params = { verb: 'ListRecords', resumptionToken: token }
      token = process_request(oai_request(oai_base_uri, params))
    end

    puts marc_collection.to_s
  end

  private

  # The <collection> document owned by this instance, created on first use.
  # Kept per instance so that separate harvesters do not append into one
  # shared document.
  def marc_collection
    @marc_collection ||= Nokogiri::XML(%(<collection xmlns="#{MARC_NAMESPACE}"/>))
  end
end
51
+ end
@@ -0,0 +1,27 @@
1
# coding: utf-8
# Gem specification for miniharvest.
lib = File.expand_path('../lib', __FILE__)
$LOAD_PATH.unshift(lib) unless $LOAD_PATH.include?(lib)
require 'miniharvest/version'

Gem::Specification.new do |spec|
  spec.name          = "miniharvest"
  spec.version       = MiniHarvest::VERSION
  spec.authors       = ["Jamie Little"]
  spec.email         = ["j.little@miami.edu"]

  spec.summary       = "A Gem to harvest OAI-PMH repositories"
  spec.description   = "Harvests sets of MARCXML records from an OAI-PMH endpoint and appends them to a single MARCXML file."
  # NOTE(review): homepage is still empty -- fill in the project URL.
  spec.homepage      = ""
  spec.license       = "MIT"

  # Package the git-tracked files, leaving out test directories and stray
  # artifacts that had been shipped by accident: .DS_Store files and editor
  # backups (names ending in "~").
  excluded = %r{\A(?:test|spec|features)/|(?:\A|/)\.DS_Store\z|~\z}
  spec.files         = `git ls-files -z`.split("\x0").reject { |f| f.match(excluded) }
  spec.bindir        = "exe"
  spec.executables   = ["miniharvest"]
  spec.require_paths = ["lib"]

  spec.add_development_dependency "bundler", "~> 1.12"
  spec.add_development_dependency "rake", "~> 10.0"
  spec.add_development_dependency "minitest", "~> 5.0"

  spec.add_runtime_dependency "nokogiri"
end
metadata ADDED
@@ -0,0 +1,115 @@
1
+ --- !ruby/object:Gem::Specification
2
+ name: miniharvest
3
+ version: !ruby/object:Gem::Version
4
+ version: 0.1.2
5
+ platform: ruby
6
+ authors:
7
+ - Jamie Little
8
+ autorequire:
9
+ bindir: exe
10
+ cert_chain: []
11
+ date: 2016-08-01 00:00:00.000000000 Z
12
+ dependencies:
13
+ - !ruby/object:Gem::Dependency
14
+ name: bundler
15
+ requirement: !ruby/object:Gem::Requirement
16
+ requirements:
17
+ - - "~>"
18
+ - !ruby/object:Gem::Version
19
+ version: '1.12'
20
+ type: :development
21
+ prerelease: false
22
+ version_requirements: !ruby/object:Gem::Requirement
23
+ requirements:
24
+ - - "~>"
25
+ - !ruby/object:Gem::Version
26
+ version: '1.12'
27
+ - !ruby/object:Gem::Dependency
28
+ name: rake
29
+ requirement: !ruby/object:Gem::Requirement
30
+ requirements:
31
+ - - "~>"
32
+ - !ruby/object:Gem::Version
33
+ version: '10.0'
34
+ type: :development
35
+ prerelease: false
36
+ version_requirements: !ruby/object:Gem::Requirement
37
+ requirements:
38
+ - - "~>"
39
+ - !ruby/object:Gem::Version
40
+ version: '10.0'
41
+ - !ruby/object:Gem::Dependency
42
+ name: minitest
43
+ requirement: !ruby/object:Gem::Requirement
44
+ requirements:
45
+ - - "~>"
46
+ - !ruby/object:Gem::Version
47
+ version: '5.0'
48
+ type: :development
49
+ prerelease: false
50
+ version_requirements: !ruby/object:Gem::Requirement
51
+ requirements:
52
+ - - "~>"
53
+ - !ruby/object:Gem::Version
54
+ version: '5.0'
55
+ - !ruby/object:Gem::Dependency
56
+ name: nokogiri
57
+ requirement: !ruby/object:Gem::Requirement
58
+ requirements:
59
+ - - ">="
60
+ - !ruby/object:Gem::Version
61
+ version: '0'
62
+ type: :runtime
63
+ prerelease: false
64
+ version_requirements: !ruby/object:Gem::Requirement
65
+ requirements:
66
+ - - ">="
67
+ - !ruby/object:Gem::Version
68
+ version: '0'
69
+ description: ''
70
+ email:
71
+ - j.little@miami.edu
72
+ executables:
73
+ - miniharvest
74
+ extensions: []
75
+ extra_rdoc_files: []
76
+ files:
77
+ - ".gitignore"
78
+ - ".travis.yml"
79
+ - Gemfile
80
+ - LICENSE.txt
81
+ - README.md
82
+ - Rakefile
83
+ - bin/console
84
+ - bin/setup
85
+ - exe/.DS_Store
86
+ - exe/miniharvest
87
+ - exe/miniharvest~
88
+ - lib/miniharvest.rb
89
+ - lib/miniharvest/version.rb
90
+ - miniharvest.gemspec
91
+ homepage: ''
92
+ licenses:
93
+ - MIT
94
+ metadata: {}
95
+ post_install_message:
96
+ rdoc_options: []
97
+ require_paths:
98
+ - lib
99
+ required_ruby_version: !ruby/object:Gem::Requirement
100
+ requirements:
101
+ - - ">="
102
+ - !ruby/object:Gem::Version
103
+ version: '0'
104
+ required_rubygems_version: !ruby/object:Gem::Requirement
105
+ requirements:
106
+ - - ">="
107
+ - !ruby/object:Gem::Version
108
+ version: '0'
109
+ requirements: []
110
+ rubyforge_project:
111
+ rubygems_version: 2.5.1
112
+ signing_key:
113
+ specification_version: 4
114
+ summary: A Gem to harvest OAI-PMH repositories
115
+ test_files: []