warclight 0.5.0 → 0.6.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/.rubocop.yml +4 -0
- data/.travis.yml +4 -1
- data/CHANGELOG.md +7 -0
- data/CODE_OF_CONDUCT.md +81 -0
- data/README.md +1 -1
- data/app/helpers/warclight_helper.rb +5 -1
- data/app/models/concerns/warclight/solr_document.rb +9 -7
- data/lib/generators/warclight/install_generator.rb +0 -5
- data/lib/generators/warclight/templates/catalog_controller.rb +3 -3
- data/lib/warclight/version.rb +1 -1
- data/solr/conf/schema.xml +6 -4
- data/solr/warclight_warc-indexer.conf +170 -0
- data/tasks/warclight.rake +2 -1
- data/template.rb +0 -1
- data/warclight.gemspec +2 -3
- metadata +11 -25
- data/app/assets/javascripts/warclight/warclight.js +0 -2
- data/app/views/layouts/warclight/application.html.erb +0 -14
checksums.yaml
CHANGED
|
@@ -1,7 +1,7 @@
|
|
|
1
1
|
---
|
|
2
2
|
SHA1:
|
|
3
|
-
metadata.gz:
|
|
4
|
-
data.tar.gz:
|
|
3
|
+
metadata.gz: a8ae7e47fad95aad7c598fb0eeba1d729bf35641
|
|
4
|
+
data.tar.gz: 47865f795f928fdeba81e30e557f0b9e9f19184c
|
|
5
5
|
SHA512:
|
|
6
|
-
metadata.gz:
|
|
7
|
-
data.tar.gz:
|
|
6
|
+
metadata.gz: 3f8ad4ff95368d0dc27d1235282c23fe88c95d3a2d27d8da1a9849fd0bcfa073232885b5faf10f0a4fe38337c8da05f19b3e3248e74568e83c461e2fe811dac8
|
|
7
|
+
data.tar.gz: b488e29c86bb559189081edf5ee8d95a6f6a401da8d501cba50ef0df701c1b97b9ff3defbab81b46f3c55b30bdc234dd69a8cc8c057e92368aca0b58523bd579
|
data/.rubocop.yml
CHANGED
data/.travis.yml
CHANGED
|
@@ -3,9 +3,12 @@ language: ruby
|
|
|
3
3
|
notifications:
|
|
4
4
|
email: false
|
|
5
5
|
rvm:
|
|
6
|
-
- 2.4.
|
|
6
|
+
- 2.4.2
|
|
7
|
+
- 2.3.5
|
|
8
|
+
- 2.2.8
|
|
7
9
|
jdk:
|
|
8
10
|
- oraclejdk8
|
|
11
|
+
- openjdk8
|
|
9
12
|
|
|
10
13
|
# Update to phantomjs 2.1.1 to fix issues with < 2
|
|
11
14
|
# See https://github.com/travis-ci/travis-ci/issues/3225#issuecomment-177592725
|
data/CHANGELOG.md
CHANGED
|
@@ -1,5 +1,12 @@
|
|
|
1
1
|
# Change Log
|
|
2
2
|
|
|
3
|
+
## [v0.5.0](https://github.com/archivesunleashed/warclight/tree/v0.5.0) (2017-10-19)
|
|
4
|
+
[Full Changelog](https://github.com/archivesunleashed/warclight/compare/v0.4.0...v0.5.0)
|
|
5
|
+
|
|
6
|
+
**Merged pull requests:**
|
|
7
|
+
|
|
8
|
+
- Align with https://github.com/ukwa/webarchive-discovery/pull/129 [\#29](https://github.com/archivesunleashed/warclight/pull/29) ([ruebot](https://github.com/ruebot))
|
|
9
|
+
|
|
3
10
|
## [v0.4.0](https://github.com/archivesunleashed/warclight/tree/v0.4.0) (2017-10-18)
|
|
4
11
|
[Full Changelog](https://github.com/archivesunleashed/warclight/compare/v0.3.0...v0.4.0)
|
|
5
12
|
|
data/CODE_OF_CONDUCT.md
ADDED
|
@@ -0,0 +1,81 @@
|
|
|
1
|
+
# Archives Unleashed Project Code of Conduct
|
|
2
|
+
|
|
3
|
+
## Our Pledge
|
|
4
|
+
|
|
5
|
+
* The Archives Unleashed Project believes in supporting an open, inclusive, and
|
|
6
|
+
diverse community which respects the experience, expertise, and knowledge of
|
|
7
|
+
all community members.
|
|
8
|
+
* The Archives Unleashed community is dedicated to providing a harassment-free
|
|
9
|
+
experience for everyone, and welcomes individuals regardless of age, body size,
|
|
10
|
+
disability, ethnicity, gender identity and expression, level of experience,
|
|
11
|
+
nationality, personal appearance, race, religion, or sexual identity and
|
|
12
|
+
orientation.
|
|
13
|
+
* To foster respectful collaborations this code of conduct applies to all
|
|
14
|
+
Archives Unleashed spaces, including, but not limited to, GitHub, Slack,
|
|
15
|
+
Medium, social media platforms and meeting spaces, both online and off.
|
|
16
|
+
* Anyone who violates this code of conduct may be sanctioned or expelled from
|
|
17
|
+
these spaces at the discretion of the Archives Unleashed Project Team.
|
|
18
|
+
|
|
19
|
+
## Our Standards
|
|
20
|
+
|
|
21
|
+
Examples of behavior that contributes to creating a positive environment
|
|
22
|
+
include:
|
|
23
|
+
|
|
24
|
+
* Using welcoming and inclusive language
|
|
25
|
+
* Being respectful of differing viewpoints and experiences
|
|
26
|
+
* Gracefully accepting constructive criticism
|
|
27
|
+
* Focusing on what is best for the community
|
|
28
|
+
* Showing empathy towards other community members
|
|
29
|
+
|
|
30
|
+
Examples of unacceptable behavior by participants include:
|
|
31
|
+
|
|
32
|
+
* The use of sexualized language or imagery and unwelcome sexual attention or
|
|
33
|
+
advances
|
|
34
|
+
* Trolling, insulting/derogatory comments, and personal or political attacks
|
|
35
|
+
* Public or private harassment
|
|
36
|
+
* Publishing others' private information, such as a physical or electronic
|
|
37
|
+
address, without explicit permission
|
|
38
|
+
* Other conduct which could reasonably be considered inappropriate in a
|
|
39
|
+
professional setting
|
|
40
|
+
|
|
41
|
+
## Our Responsibilities
|
|
42
|
+
|
|
43
|
+
Project maintainers are responsible for clarifying the standards of acceptable
|
|
44
|
+
behavior and are expected to take appropriate and fair corrective action in
|
|
45
|
+
response to any instances of unacceptable behavior.
|
|
46
|
+
|
|
47
|
+
Project maintainers have the right and responsibility to remove, edit, or
|
|
48
|
+
reject comments, commits, code, wiki edits, issues, and other contributions
|
|
49
|
+
that are not aligned to this Code of Conduct, or to ban temporarily or
|
|
50
|
+
permanently any contributor for other behaviors that they deem inappropriate,
|
|
51
|
+
threatening, offensive, or harmful.
|
|
52
|
+
|
|
53
|
+
## Scope
|
|
54
|
+
|
|
55
|
+
This Code of Conduct applies both within project spaces and in public spaces
|
|
56
|
+
when an individual is representing the project or its community. Examples of
|
|
57
|
+
representing a project or community include using an official project e-mail
|
|
58
|
+
address, posting via an official social media account, or acting as an appointed
|
|
59
|
+
representative at an online or offline event. Representation of a project may be
|
|
60
|
+
further defined and clarified by project maintainers.
|
|
61
|
+
|
|
62
|
+
## Enforcement
|
|
63
|
+
|
|
64
|
+
Instances of abusive, harassing, or otherwise unacceptable behavior may be
|
|
65
|
+
reported by contacting the project team at archivesunleashed@gmail.com. All
|
|
66
|
+
complaints will be reviewed and investigated and will result in a response that
|
|
67
|
+
is deemed necessary and appropriate to the circumstances. The project team is
|
|
68
|
+
obligated to maintain confidentiality with regard to the reporter of an incident.
|
|
69
|
+
Further details of specific enforcement policies may be posted separately.
|
|
70
|
+
|
|
71
|
+
Project maintainers who do not follow or enforce the Code of Conduct in good
|
|
72
|
+
faith may face temporary or permanent repercussions as determined by other
|
|
73
|
+
members of the project's leadership.
|
|
74
|
+
|
|
75
|
+
## Attribution
|
|
76
|
+
|
|
77
|
+
This Code of Conduct is adapted from the [Contributor Covenant][homepage], version 1.4,
|
|
78
|
+
available at [http://contributor-covenant.org/version/1/4][version]
|
|
79
|
+
|
|
80
|
+
[homepage]: http://contributor-covenant.org
|
|
81
|
+
[version]: http://contributor-covenant.org/version/1/4/
|
data/README.md
CHANGED
|
@@ -10,7 +10,7 @@ A [Project Blacklight](http://projectblacklight.org/) based [Rails engine](http:
|
|
|
10
10
|
## Requirements
|
|
11
11
|
|
|
12
12
|
* [Ruby](https://www.ruby-lang.org/en/) 2.2 or later
|
|
13
|
-
* [Rails](http://rubyonrails.org) 5.
|
|
13
|
+
* [Rails](http://rubyonrails.org) 5.0.0 or later
|
|
14
14
|
|
|
15
15
|
## Installation
|
|
16
16
|
|
|
@@ -8,15 +8,17 @@ module Warclight
|
|
|
8
8
|
|
|
9
9
|
def replay_link
|
|
10
10
|
time_travel_base_url = 'http://timetravel.mementoweb.org/api/json/'
|
|
11
|
-
|
|
12
|
-
time_travel_time = (Time.parse(first(:crawl_date)).strftime time_travel_time_format).to_s
|
|
13
|
-
time_travel_request_url = time_travel_base_url + time_travel_time + '/' + first(:url).to_s
|
|
11
|
+
time_travel_request_url = time_travel_base_url + first(:wayback_date).to_s + '/' + first(:url).to_s
|
|
14
12
|
time_travel_request = URI(time_travel_request_url)
|
|
15
13
|
time_travel_response = Net::HTTP.get(time_travel_request)
|
|
16
|
-
|
|
17
|
-
|
|
18
|
-
|
|
19
|
-
|
|
14
|
+
if time_travel_response.present?
|
|
15
|
+
time_travel_response_json = JSON.parse(time_travel_response)
|
|
16
|
+
replay_url = time_travel_response_json['mementos']['closest']['uri'][0]
|
|
17
|
+
replay_url_link = '<a href="' + "#{replay_url}" '" target="_blank">'"#{replay_url}"'</a> 🔗'
|
|
18
|
+
replay_url_link.html_safe
|
|
19
|
+
else
|
|
20
|
+
replay_url = 'Not Available.'
|
|
21
|
+
end
|
|
20
22
|
end
|
|
21
23
|
end
|
|
22
24
|
end
|
|
@@ -19,10 +19,6 @@ module Warclight
|
|
|
19
19
|
end
|
|
20
20
|
end
|
|
21
21
|
|
|
22
|
-
def install_blacklight_range_limit
|
|
23
|
-
generate 'blacklight_range_limit:install'
|
|
24
|
-
end
|
|
25
|
-
|
|
26
22
|
def add_custom_routes
|
|
27
23
|
inject_into_file 'config/routes.rb', after: "mount Blacklight::Engine => '/'" do
|
|
28
24
|
"\n mount Warclight::Engine => '/'\n"
|
|
@@ -31,7 +27,6 @@ module Warclight
|
|
|
31
27
|
|
|
32
28
|
def assets
|
|
33
29
|
copy_file 'warclight.scss', 'app/assets/stylesheets/warclight.scss'
|
|
34
|
-
copy_file 'warclight.js', 'app/assets/javascripts/warclight.js'
|
|
35
30
|
inject_into_file 'app/assets/javascripts/application.js', after: '//= require blacklight/blacklight' do
|
|
36
31
|
"\n//= require bootstrap/scrollspy\n" \
|
|
37
32
|
"\n//= require bootstrap/tab\n"
|
|
@@ -48,13 +48,13 @@ class CatalogController < ApplicationController
|
|
|
48
48
|
# :index_range can be an array or range of prefixes that will be used to
|
|
49
49
|
# create the navigation (note: It is case sensitive when searching values)
|
|
50
50
|
|
|
51
|
-
config.add_facet_field 'content_type_norm', label: 'General Content Type', collapse: false
|
|
52
|
-
config.add_facet_field 'crawl_year', label: 'Crawl Year', collapse: false,
|
|
51
|
+
config.add_facet_field 'content_type_norm', label: 'General Content Type', collapse: false
|
|
52
|
+
config.add_facet_field 'crawl_year', label: 'Crawl Year', collapse: false, sort: 'index'
|
|
53
53
|
config.add_facet_field 'public_suffix', label: 'Public Suffix', collapse: false, limit: true
|
|
54
54
|
config.add_facet_field 'domain', label: 'Domain', limit: true
|
|
55
55
|
config.add_facet_field 'links_domains', label: 'Links Domains', limit: true
|
|
56
56
|
config.add_facet_field 'content_language', label: 'Content Language', limit: true
|
|
57
|
-
config.add_facet_field '
|
|
57
|
+
config.add_facet_field 'resourcename_facet', label: 'Resource Name', limit: true
|
|
58
58
|
config.add_facet_field 'institution', label: 'Institution'
|
|
59
59
|
config.add_facet_field 'collection', label: 'Collection'
|
|
60
60
|
config.add_facet_field 'collection_id', label: 'Collection Id'
|
data/lib/warclight/version.rb
CHANGED
data/solr/conf/schema.xml
CHANGED
|
@@ -24,7 +24,7 @@
|
|
|
24
24
|
<field name="_text_" type="text_general" indexed="true" stored="false" multiValued="true"/>
|
|
25
25
|
|
|
26
26
|
<!--Not defined in SolrFields. Schema only definition -->
|
|
27
|
-
<field name="index_time" type="date" indexed="true" stored="false" docValues="true" default="NOW" />
|
|
27
|
+
<field name="index_time" type="date" indexed="true" stored="false" docValues="true" default="NOW" />
|
|
28
28
|
|
|
29
29
|
<!-- BL UKWA: additional -->
|
|
30
30
|
<field name="access_terms" type="string" indexed="true" docValues="true" multiValued="true"/>
|
|
@@ -76,7 +76,7 @@
|
|
|
76
76
|
<field name="last_modified" type="tdate" indexed="true" stored="true" docValues="true"/>
|
|
77
77
|
<field name="last_modified_year" type="string" indexed="true" docValues="true"/>
|
|
78
78
|
<field name="license_url" type="string" indexed="true" docValues="true" multiValued="true"/>
|
|
79
|
-
<field name="links_images" type="
|
|
79
|
+
<field name="links_images" type="text_general" indexed="true" stored="true" multiValued="true"/>
|
|
80
80
|
<field name="links_domains" type="string" indexed="true" docValues="true" multiValued="true"/>
|
|
81
81
|
<field name="links_hosts" type="string" indexed="true" docValues="true" multiValued="true"/>
|
|
82
82
|
<field name="links_hosts_surts" type="string" indexed="true" docValues="true" multiValued="true"/>
|
|
@@ -85,7 +85,7 @@
|
|
|
85
85
|
<field name="links" type="string" indexed="true" docValues="true" multiValued="true"/>
|
|
86
86
|
<field name="locations" type="location" indexed="true" stored="true" multiValued="true"/>
|
|
87
87
|
<field name="parse_error" type="string" indexed="true" docValues="true" multiValued="true"/>
|
|
88
|
-
<field name="pdf_pdfa_errors" type="
|
|
88
|
+
<field name="pdf_pdfa_errors" type="text_general" indexed="false" stored="true" multiValued="true"/>
|
|
89
89
|
<field name="pdf_pdfa_is_valid" type="string" indexed="true" docValues="true" multiValued="false"/>
|
|
90
90
|
<field name="postcode_district" type="string" indexed="true" docValues="true" multiValued="true"/>
|
|
91
91
|
<field name="postcode" type="string" indexed="true" docValues="true" multiValued="true"/>
|
|
@@ -93,8 +93,10 @@
|
|
|
93
93
|
<field name="publication_year" type="string" indexed="true" docValues="true" multiValued="false"/>
|
|
94
94
|
<field name="public_suffix" type="string" indexed="true" docValues="true" multiValued="false"/>
|
|
95
95
|
<field name="record_type" type="string" indexed="true" stored="true" multiValued="false" docValues="true"/>
|
|
96
|
+
<field name="redirect_to_norm" type="string" indexed="true" stored="false" docValues="true" multiValued="false"/>
|
|
96
97
|
<field name="referrer_url" type="string" indexed="true" stored="true" multiValued="false" docValues="true"/>
|
|
97
98
|
<field name="resourcename" type="text_general" indexed="true" stored="true"/>
|
|
99
|
+
<field name="resourcename_facet" type="string" indexed="false" stored="false" docValues="true" multiValued="false"/>
|
|
98
100
|
<field name="sentiment_score" type="float" indexed="true" stored="true" multiValued="false"/>
|
|
99
101
|
<field name="sentiment" type="string" indexed="true" docValues="true" multiValued="false"/>
|
|
100
102
|
<field name="server" type="string" indexed="true" docValues="true" multiValued="true"/>
|
|
@@ -192,7 +194,7 @@
|
|
|
192
194
|
<copyField source="wct_description" dest="text"/>
|
|
193
195
|
<copyField source="url" dest="text"/>
|
|
194
196
|
<copyField source="content" dest="text"/>
|
|
195
|
-
<copyField source="resourcename" dest="
|
|
197
|
+
<copyField source="resourcename" dest="resourcename_facet"/>
|
|
196
198
|
|
|
197
199
|
<types>
|
|
198
200
|
<fieldType name="string" class="solr.StrField" sortMissingLast="true" />
|
|
@@ -0,0 +1,170 @@
|
|
|
1
|
+
{
|
|
2
|
+
"warc": {
|
|
3
|
+
"title": "Default Warclight warc-indexer config.",
|
|
4
|
+
"http_proxy": {},
|
|
5
|
+
"solr": {
|
|
6
|
+
"batch_size": 500,
|
|
7
|
+
"num_shards": 1,
|
|
8
|
+
"dummy_run": false,
|
|
9
|
+
"num_threads": 1,
|
|
10
|
+
"disablecommit": true,
|
|
11
|
+
"use_hash_url_id": true,
|
|
12
|
+
"check_solr_for_duplicates": true,
|
|
13
|
+
|
|
14
|
+
"field_setup": {
|
|
15
|
+
"fields" : {
|
|
16
|
+
"url" : { "max_length" : 2048 },
|
|
17
|
+
"url_norm" : { "max_length" : 2048 },
|
|
18
|
+
"links" : { "max_length" : 2048 },
|
|
19
|
+
"content" : { "max_length" : 512K },
|
|
20
|
+
},
|
|
21
|
+
},
|
|
22
|
+
},
|
|
23
|
+
"index": {
|
|
24
|
+
"tika": {
|
|
25
|
+
"parse_timeout": 300000,
|
|
26
|
+
"use_boilerpipe": false,
|
|
27
|
+
"extract_all_metadata": false,
|
|
28
|
+
"exclude_mime": [
|
|
29
|
+
"x-tar",
|
|
30
|
+
"x-gzip",
|
|
31
|
+
"bz",
|
|
32
|
+
"lz",
|
|
33
|
+
"compress",
|
|
34
|
+
"zip",
|
|
35
|
+
"javascript",
|
|
36
|
+
"css",
|
|
37
|
+
"octet-stream"
|
|
38
|
+
],
|
|
39
|
+
"max_text_length": "512K"
|
|
40
|
+
},
|
|
41
|
+
"id": {
|
|
42
|
+
"useResourceURI": true,
|
|
43
|
+
"droid": {
|
|
44
|
+
"enabled": true,
|
|
45
|
+
"useBinarySignaturesOnly": false
|
|
46
|
+
}
|
|
47
|
+
},
|
|
48
|
+
"exclusions": {
|
|
49
|
+
"enabled": false,
|
|
50
|
+
"check_interval": 600,
|
|
51
|
+
"file": "/path/to/exclude.txt"
|
|
52
|
+
},
|
|
53
|
+
"extract": {
|
|
54
|
+
"onDiskThreshold": "500M",
|
|
55
|
+
"response_include": [
|
|
56
|
+
"1",
|
|
57
|
+
"2",
|
|
58
|
+
"3",
|
|
59
|
+
"4",
|
|
60
|
+
"5",
|
|
61
|
+
"6",
|
|
62
|
+
"7",
|
|
63
|
+
"8",
|
|
64
|
+
"9"
|
|
65
|
+
],
|
|
66
|
+
"url_exclude": [],
|
|
67
|
+
"protocol_include": [
|
|
68
|
+
"http",
|
|
69
|
+
"https"
|
|
70
|
+
],
|
|
71
|
+
"record_type_include": [
|
|
72
|
+
"response",
|
|
73
|
+
"revisit"
|
|
74
|
+
],
|
|
75
|
+
"inMemoryThreshold": "500M",
|
|
76
|
+
"content": {
|
|
77
|
+
"text": true,
|
|
78
|
+
"text_stored": true,
|
|
79
|
+
"elements_used": true,
|
|
80
|
+
"first_bytes": {
|
|
81
|
+
"num_bytes": 32,
|
|
82
|
+
"enabled": true
|
|
83
|
+
},
|
|
84
|
+
"annotations": {
|
|
85
|
+
"enabled": false,
|
|
86
|
+
"file": "/path/to/annotations.json",
|
|
87
|
+
"surt_prefix_file": "/path/to/openAccessSurts.txt"
|
|
88
|
+
},
|
|
89
|
+
"images": {
|
|
90
|
+
"dominantColours": false,
|
|
91
|
+
"maxSizeInBytes": "50M",
|
|
92
|
+
"detectFaces": false,
|
|
93
|
+
"analysisSamplingRate": 1,
|
|
94
|
+
"enabled": true
|
|
95
|
+
},
|
|
96
|
+
"extractApachePreflightErrors": false,
|
|
97
|
+
"text_fuzzy_hash": true,
|
|
98
|
+
"text_extract_postcodes": false,
|
|
99
|
+
"language": {
|
|
100
|
+
"langdetectprofiles": [
|
|
101
|
+
"en",
|
|
102
|
+
"fr",
|
|
103
|
+
"af",
|
|
104
|
+
"ar",
|
|
105
|
+
"bg",
|
|
106
|
+
"bn",
|
|
107
|
+
"cs",
|
|
108
|
+
"de",
|
|
109
|
+
"el",
|
|
110
|
+
"es",
|
|
111
|
+
"et",
|
|
112
|
+
"fa",
|
|
113
|
+
"fi",
|
|
114
|
+
"da",
|
|
115
|
+
"gu",
|
|
116
|
+
"he",
|
|
117
|
+
"hi",
|
|
118
|
+
"hr",
|
|
119
|
+
"hu",
|
|
120
|
+
"id",
|
|
121
|
+
"it",
|
|
122
|
+
"ja",
|
|
123
|
+
"kn",
|
|
124
|
+
"ko",
|
|
125
|
+
"lt",
|
|
126
|
+
"lv",
|
|
127
|
+
"mk",
|
|
128
|
+
"ml",
|
|
129
|
+
"mr",
|
|
130
|
+
"ne",
|
|
131
|
+
"nl",
|
|
132
|
+
"no",
|
|
133
|
+
"pa",
|
|
134
|
+
"pl",
|
|
135
|
+
"pt",
|
|
136
|
+
"ro",
|
|
137
|
+
"ru",
|
|
138
|
+
"sk",
|
|
139
|
+
"sl",
|
|
140
|
+
"so",
|
|
141
|
+
"sq",
|
|
142
|
+
"sv",
|
|
143
|
+
"sw",
|
|
144
|
+
"ta",
|
|
145
|
+
"te",
|
|
146
|
+
"th",
|
|
147
|
+
"tl",
|
|
148
|
+
"tr",
|
|
149
|
+
"uk",
|
|
150
|
+
"ur",
|
|
151
|
+
"vi",
|
|
152
|
+
"zh-cn",
|
|
153
|
+
"zh-tw"
|
|
154
|
+
],
|
|
155
|
+
"enabled": true
|
|
156
|
+
},
|
|
157
|
+
"test_sentimentj": false,
|
|
158
|
+
"text_stanford_ner": false
|
|
159
|
+
},
|
|
160
|
+
"linked": {
|
|
161
|
+
"hosts": true,
|
|
162
|
+
"resources": true,
|
|
163
|
+
"domains": true,
|
|
164
|
+
"normalise": true,
|
|
165
|
+
"images": true
|
|
166
|
+
}
|
|
167
|
+
}
|
|
168
|
+
}
|
|
169
|
+
}
|
|
170
|
+
}
|
data/tasks/warclight.rake
CHANGED
|
@@ -56,6 +56,7 @@ namespace :warclight do
|
|
|
56
56
|
puts 'Seeding index with data from spec/fixtures/warcs/...'
|
|
57
57
|
# rubocop:disable Metrics/LineLength
|
|
58
58
|
system('curl -o ".internal_test_app/tmp/warc-indexer.jar" "http://alpha.library.yorku.ca/warc-indexer-3.0.0-SNAPSHOT-jar-with-dependencies.jar"')
|
|
59
|
-
system('java -Djava.io.tmpdir=.internal_test_app/tmp -jar .internal_test_app/tmp/warc-indexer.jar -i "York University Libraries" -n "Test Collection" -u "12345" -s http://localhost:8983/solr/blacklight-core spec/fixtures/warcs/*.gz')
|
|
59
|
+
system('java -Djava.io.tmpdir=.internal_test_app/tmp -jar .internal_test_app/tmp/warc-indexer.jar -c .internal_test_app/solr/warclight_warc-indexer.conf -i "York University Libraries" -n "Test Collection" -u "12345" -s http://localhost:8983/solr/blacklight-core spec/fixtures/warcs/*.gz')
|
|
60
|
+
system('curl "http://localhost:8983/solr/blacklight-core/update?commit=true&openSearcher=true"')
|
|
60
61
|
end
|
|
61
62
|
end
|
data/template.rb
CHANGED
|
@@ -3,7 +3,6 @@
|
|
|
3
3
|
# We can remove `blacklight` and `blacklight_range_limit` once they are released
|
|
4
4
|
# since they are already dependents of Warclight (but we need to pin to particular branches)
|
|
5
5
|
gem 'blacklight', github: 'projectblacklight/blacklight'
|
|
6
|
-
gem 'blacklight_range_limit', github: 'projectblacklight/blacklight_range_limit', branch: 'blacklight-7'
|
|
7
6
|
|
|
8
7
|
gem 'warclight', github: 'archivesunleashed/warclight'
|
|
9
8
|
|
data/warclight.gemspec
CHANGED
|
@@ -22,11 +22,10 @@ Gem::Specification.new do |s|
|
|
|
22
22
|
s.require_paths = ['lib']
|
|
23
23
|
|
|
24
24
|
s.add_dependency 'blacklight'
|
|
25
|
-
s.add_dependency '
|
|
26
|
-
s.add_dependency 'rails', '~> 5.1.2'
|
|
25
|
+
s.add_dependency 'rails', '~> 5.0'
|
|
27
26
|
|
|
28
27
|
s.add_development_dependency 'bundler', '~> 1.14'
|
|
29
|
-
s.add_development_dependency 'engine_cart'
|
|
28
|
+
s.add_development_dependency 'engine_cart', '~> 1.2.0'
|
|
30
29
|
s.add_development_dependency 'mocha'
|
|
31
30
|
s.add_development_dependency 'poltergeist'
|
|
32
31
|
s.add_development_dependency 'rake', '~> 12.0'
|
metadata
CHANGED
|
@@ -1,14 +1,14 @@
|
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
|
2
2
|
name: warclight
|
|
3
3
|
version: !ruby/object:Gem::Version
|
|
4
|
-
version: 0.
|
|
4
|
+
version: 0.6.0
|
|
5
5
|
platform: ruby
|
|
6
6
|
authors:
|
|
7
7
|
- Nick Ruest
|
|
8
8
|
autorequire:
|
|
9
9
|
bindir: exe
|
|
10
10
|
cert_chain: []
|
|
11
|
-
date:
|
|
11
|
+
date: 2018-04-30 00:00:00.000000000 Z
|
|
12
12
|
dependencies:
|
|
13
13
|
- !ruby/object:Gem::Dependency
|
|
14
14
|
name: blacklight
|
|
@@ -24,34 +24,20 @@ dependencies:
|
|
|
24
24
|
- - ">="
|
|
25
25
|
- !ruby/object:Gem::Version
|
|
26
26
|
version: '0'
|
|
27
|
-
- !ruby/object:Gem::Dependency
|
|
28
|
-
name: blacklight_range_limit
|
|
29
|
-
requirement: !ruby/object:Gem::Requirement
|
|
30
|
-
requirements:
|
|
31
|
-
- - ">="
|
|
32
|
-
- !ruby/object:Gem::Version
|
|
33
|
-
version: '0'
|
|
34
|
-
type: :runtime
|
|
35
|
-
prerelease: false
|
|
36
|
-
version_requirements: !ruby/object:Gem::Requirement
|
|
37
|
-
requirements:
|
|
38
|
-
- - ">="
|
|
39
|
-
- !ruby/object:Gem::Version
|
|
40
|
-
version: '0'
|
|
41
27
|
- !ruby/object:Gem::Dependency
|
|
42
28
|
name: rails
|
|
43
29
|
requirement: !ruby/object:Gem::Requirement
|
|
44
30
|
requirements:
|
|
45
31
|
- - "~>"
|
|
46
32
|
- !ruby/object:Gem::Version
|
|
47
|
-
version: 5.
|
|
33
|
+
version: '5.0'
|
|
48
34
|
type: :runtime
|
|
49
35
|
prerelease: false
|
|
50
36
|
version_requirements: !ruby/object:Gem::Requirement
|
|
51
37
|
requirements:
|
|
52
38
|
- - "~>"
|
|
53
39
|
- !ruby/object:Gem::Version
|
|
54
|
-
version: 5.
|
|
40
|
+
version: '5.0'
|
|
55
41
|
- !ruby/object:Gem::Dependency
|
|
56
42
|
name: bundler
|
|
57
43
|
requirement: !ruby/object:Gem::Requirement
|
|
@@ -70,16 +56,16 @@ dependencies:
|
|
|
70
56
|
name: engine_cart
|
|
71
57
|
requirement: !ruby/object:Gem::Requirement
|
|
72
58
|
requirements:
|
|
73
|
-
- - "
|
|
59
|
+
- - "~>"
|
|
74
60
|
- !ruby/object:Gem::Version
|
|
75
|
-
version:
|
|
61
|
+
version: 1.2.0
|
|
76
62
|
type: :development
|
|
77
63
|
prerelease: false
|
|
78
64
|
version_requirements: !ruby/object:Gem::Requirement
|
|
79
65
|
requirements:
|
|
80
|
-
- - "
|
|
66
|
+
- - "~>"
|
|
81
67
|
- !ruby/object:Gem::Version
|
|
82
|
-
version:
|
|
68
|
+
version: 1.2.0
|
|
83
69
|
- !ruby/object:Gem::Dependency
|
|
84
70
|
name: mocha
|
|
85
71
|
requirement: !ruby/object:Gem::Requirement
|
|
@@ -206,6 +192,7 @@ files:
|
|
|
206
192
|
- ".solr_wrapper"
|
|
207
193
|
- ".travis.yml"
|
|
208
194
|
- CHANGELOG.md
|
|
195
|
+
- CODE_OF_CONDUCT.md
|
|
209
196
|
- CONTRIBUTING.md
|
|
210
197
|
- Gemfile
|
|
211
198
|
- LICENSE.txt
|
|
@@ -213,7 +200,6 @@ files:
|
|
|
213
200
|
- Rakefile
|
|
214
201
|
- app/assets/images/blacklight/compact.svg
|
|
215
202
|
- app/assets/images/blacklight/logo.png
|
|
216
|
-
- app/assets/javascripts/warclight/warclight.js
|
|
217
203
|
- app/assets/stylesheets/warclight/application.scss
|
|
218
204
|
- app/assets/stylesheets/warclight/warclight.scss
|
|
219
205
|
- app/controllers/concerns/warclight/field_config_helpers.rb
|
|
@@ -222,7 +208,6 @@ files:
|
|
|
222
208
|
- app/models/concerns/warclight/catalog.rb
|
|
223
209
|
- app/models/concerns/warclight/search_behavior.rb
|
|
224
210
|
- app/models/concerns/warclight/solr_document.rb
|
|
225
|
-
- app/views/layouts/warclight/application.html.erb
|
|
226
211
|
- bin/rails
|
|
227
212
|
- config/routes.rb
|
|
228
213
|
- lib/generators/warclight/install_generator.rb
|
|
@@ -279,6 +264,7 @@ files:
|
|
|
279
264
|
- solr/conf/solrconfig.xml
|
|
280
265
|
- solr/conf/stopwords.txt
|
|
281
266
|
- solr/conf/synonyms.txt
|
|
267
|
+
- solr/warclight_warc-indexer.conf
|
|
282
268
|
- tasks/warclight.rake
|
|
283
269
|
- template.rb
|
|
284
270
|
- vendor/assets/javascripts/responsiveTruncator.js
|
|
@@ -304,7 +290,7 @@ required_rubygems_version: !ruby/object:Gem::Requirement
|
|
|
304
290
|
version: '0'
|
|
305
291
|
requirements: []
|
|
306
292
|
rubyforge_project:
|
|
307
|
-
rubygems_version: 2.6.
|
|
293
|
+
rubygems_version: 2.6.14.1
|
|
308
294
|
signing_key:
|
|
309
295
|
specification_version: 4
|
|
310
296
|
summary: A Rails engine supporting discovery of web archives.
|
|
@@ -1,14 +0,0 @@
|
|
|
1
|
-
<!DOCTYPE html>
|
|
2
|
-
<html>
|
|
3
|
-
<head>
|
|
4
|
-
<title>Warclight</title>
|
|
5
|
-
<%= stylesheet_link_tag "warclight/application", media: "all" %>
|
|
6
|
-
<%= javascript_include_tag "warclight/application" %>
|
|
7
|
-
<%= csrf_meta_tags %>
|
|
8
|
-
</head>
|
|
9
|
-
<body>
|
|
10
|
-
|
|
11
|
-
<%= yield %>
|
|
12
|
-
|
|
13
|
-
</body>
|
|
14
|
-
</html>
|