liveblog-indexer 0.1.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +7 -0
- checksums.yaml.gz.sig +5 -0
- data/lib/liveblog-indexer.rb +76 -0
- data.tar.gz.sig +0 -0
- metadata +108 -0
- metadata.gz.sig +1 -0
checksums.yaml
ADDED
@@ -0,0 +1,7 @@
|
|
1
|
+
---
|
2
|
+
SHA1:
|
3
|
+
metadata.gz: 56937c6f8eb2b40f417e73a5512fa60593647517
|
4
|
+
data.tar.gz: a87152912b799beab92e305565065ee391364b32
|
5
|
+
SHA512:
|
6
|
+
metadata.gz: 9e99db1533e3279c4d4b70ddb58609fb5e234e8e9124d401bff3970d5e8d2ffa5671556d1ec0e6706c0212868bde0c469f5e07e5a85609838aa5494df7bf9426
|
7
|
+
data.tar.gz: 9d58190002e8cb8b490c61879f47901fe07c0ec374546dd52fae46d0c5c95ec8a6dce1c92eff850e957c0d776fe99f59577eb5c32f1bf46c2512a516140f385e
|
checksums.yaml.gz.sig
ADDED
@@ -0,0 +1,76 @@
|
|
1
|
+
#!/usr/bin/env ruby
|
2
|
+
|
3
|
+
# file: liveblog-indexer.rb
|
4
|
+
|
5
|
+
require 'xws'
|
6
|
+
require 'json'
|
7
|
+
require 'polyrex'
|
8
|
+
|
9
|
+
|
10
|
+
class LiveBlogIndexer
|
11
|
+
|
12
|
+
def initialize(filepath=nil)
|
13
|
+
|
14
|
+
@master = if filepath and File.exists? filepath then
|
15
|
+
JSON.parse(File.read(filepath))
|
16
|
+
else
|
17
|
+
{}
|
18
|
+
end
|
19
|
+
|
20
|
+
@xws = XWS.new
|
21
|
+
|
22
|
+
end
|
23
|
+
|
24
|
+
def add_index(src)
|
25
|
+
|
26
|
+
doc = Rexle.new(RXFHelper.read(src).first )
|
27
|
+
sections = doc.root.xpath 'records/section'
|
28
|
+
|
29
|
+
sections.each do |section|
|
30
|
+
|
31
|
+
url = "%s/#%s" % [src[/^https?:\/\/[^\/]+(.*)(?=\/formatted.xml$)/,1], \
|
32
|
+
section.attributes[:id]]
|
33
|
+
|
34
|
+
h = @xws.scan section.element('details')
|
35
|
+
|
36
|
+
h.each do |k, v|
|
37
|
+
|
38
|
+
word, count = k, v
|
39
|
+
|
40
|
+
keyword = @master[word]
|
41
|
+
|
42
|
+
if keyword then
|
43
|
+
|
44
|
+
keyword[url] = count
|
45
|
+
|
46
|
+
else
|
47
|
+
|
48
|
+
@master[word] = {}
|
49
|
+
@master[word][url] = count
|
50
|
+
|
51
|
+
end # /keyword
|
52
|
+
end # /h
|
53
|
+
end # /section
|
54
|
+
end # /add_index
|
55
|
+
|
56
|
+
|
57
|
+
def save(filepath=nil)
|
58
|
+
|
59
|
+
File.write filepath, @master.to_json
|
60
|
+
puts 'saved ' + File.basename(filepath)
|
61
|
+
|
62
|
+
px = Polyrex.new 'words/key[word]/location[url, wordcount]'
|
63
|
+
|
64
|
+
@master.each do |k,rows|
|
65
|
+
px.create.key(word: k) do |create|
|
66
|
+
rows.each do |k, v|
|
67
|
+
create.location url: k, wordcount: v
|
68
|
+
end
|
69
|
+
end
|
70
|
+
end
|
71
|
+
pxfilepath = File.join(File.dirname(filepath), 'search-index.xml')
|
72
|
+
px.save pxfilepath, options: {pretty: true}
|
73
|
+
puts 'saved ' + File.basename(pxfilepath)
|
74
|
+
end
|
75
|
+
|
76
|
+
end
|
data.tar.gz.sig
ADDED
Binary file
|
metadata
ADDED
@@ -0,0 +1,108 @@
|
|
1
|
+
--- !ruby/object:Gem::Specification
|
2
|
+
name: liveblog-indexer
|
3
|
+
version: !ruby/object:Gem::Version
|
4
|
+
version: 0.1.0
|
5
|
+
platform: ruby
|
6
|
+
authors:
|
7
|
+
- James Robertson
|
8
|
+
autorequire:
|
9
|
+
bindir: bin
|
10
|
+
cert_chain:
|
11
|
+
- |
|
12
|
+
-----BEGIN CERTIFICATE-----
|
13
|
+
MIIDljCCAn6gAwIBAgIBATANBgkqhkiG9w0BAQUFADBIMRIwEAYDVQQDDAlnZW1t
|
14
|
+
YXN0ZXIxHjAcBgoJkiaJk/IsZAEZFg5qYW1lc3JvYmVydHNvbjESMBAGCgmSJomT
|
15
|
+
8ixkARkWAmV1MB4XDTE1MTExMjIxMTkyMVoXDTE2MTExMTIxMTkyMVowSDESMBAG
|
16
|
+
A1UEAwwJZ2VtbWFzdGVyMR4wHAYKCZImiZPyLGQBGRYOamFtZXNyb2JlcnRzb24x
|
17
|
+
EjAQBgoJkiaJk/IsZAEZFgJldTCCASIwDQYJKoZIhvcNAQEBBQADggEPADCCAQoC
|
18
|
+
ggEBAMjQ3f/YG2mPM5EMmrUlk2/+K3hOdZCCNIsuVYmfDaSVJO7T2A1hGDpp6qw2
|
19
|
+
NDCOLKXJ8B8MkIuSTZlsqIcM52RtZDLtjuFQvxlDysHjQdS89ab9NXSH+FtjEsnl
|
20
|
+
MAw+HB1na9+esmUfORTq3Qvf8/NVanJ0jpO78zZhHoIcH6/ZNxLGXEXhxCA3SSL/
|
21
|
+
RUwnF2ds4EmYjpYAF4DrtT7uRP80sOa5JDO9HWRIsJH70uZu/YNkzgD4qw9mssUW
|
22
|
+
yCDOOPPBXu1ZyCTYlkb8REMoZHCbIDASY/fJHmB+lfwI7WR10NauCNdru+d5L6db
|
23
|
+
lZ2+imBz1/JaibgbzwtUTkXbw8ECAwEAAaOBijCBhzAJBgNVHRMEAjAAMAsGA1Ud
|
24
|
+
DwQEAwIEsDAdBgNVHQ4EFgQUDiC6KdE35bCvxp4kHsAfxpJz4dEwJgYDVR0RBB8w
|
25
|
+
HYEbZ2VtbWFzdGVyQGphbWVzcm9iZXJ0c29uLmV1MCYGA1UdEgQfMB2BG2dlbW1h
|
26
|
+
c3RlckBqYW1lc3JvYmVydHNvbi5ldTANBgkqhkiG9w0BAQUFAAOCAQEAh7gf6A0R
|
27
|
+
5MN6ar8lV6/5ONlT9aljXGddCasCyC0pM94TIjH/2QblBWRodcb/oTGcnf28s9Zs
|
28
|
+
zBbBfl+YNUAS/y2a3Qj8/xgCC003tXgSuvXzrMlQ/o+2gDuLuGEkId8ceUXfUuXf
|
29
|
+
F4uMWpNiNk1Wt41dDGTzn9oCPt7Ssau3MqfiI5Lyl4lFQNqI+NlnsSkuJ3Fj7yOy
|
30
|
+
f1v1HUEOKUabrwhEuev8u1qZh+K4wUcsEkcvI06xLgObh2dbV2lW1Z0cOF7X8hWQ
|
31
|
+
mOnsi2V1CXpq2biJtSgD7mBx4cO9FXgbK3Xnsv45ygAPo6jj4Eb34udqz+0v88Ys
|
32
|
+
KoTqNQOniHAW2w==
|
33
|
+
-----END CERTIFICATE-----
|
34
|
+
date: 2015-11-12 00:00:00.000000000 Z
|
35
|
+
dependencies:
|
36
|
+
- !ruby/object:Gem::Dependency
|
37
|
+
name: xws
|
38
|
+
requirement: !ruby/object:Gem::Requirement
|
39
|
+
requirements:
|
40
|
+
- - "~>"
|
41
|
+
- !ruby/object:Gem::Version
|
42
|
+
version: '0.1'
|
43
|
+
- - ">="
|
44
|
+
- !ruby/object:Gem::Version
|
45
|
+
version: 0.1.1
|
46
|
+
type: :runtime
|
47
|
+
prerelease: false
|
48
|
+
version_requirements: !ruby/object:Gem::Requirement
|
49
|
+
requirements:
|
50
|
+
- - "~>"
|
51
|
+
- !ruby/object:Gem::Version
|
52
|
+
version: '0.1'
|
53
|
+
- - ">="
|
54
|
+
- !ruby/object:Gem::Version
|
55
|
+
version: 0.1.1
|
56
|
+
- !ruby/object:Gem::Dependency
|
57
|
+
name: polyrex
|
58
|
+
requirement: !ruby/object:Gem::Requirement
|
59
|
+
requirements:
|
60
|
+
- - "~>"
|
61
|
+
- !ruby/object:Gem::Version
|
62
|
+
version: '1.0'
|
63
|
+
- - ">="
|
64
|
+
- !ruby/object:Gem::Version
|
65
|
+
version: 1.0.11
|
66
|
+
type: :runtime
|
67
|
+
prerelease: false
|
68
|
+
version_requirements: !ruby/object:Gem::Requirement
|
69
|
+
requirements:
|
70
|
+
- - "~>"
|
71
|
+
- !ruby/object:Gem::Version
|
72
|
+
version: '1.0'
|
73
|
+
- - ">="
|
74
|
+
- !ruby/object:Gem::Version
|
75
|
+
version: 1.0.11
|
76
|
+
description:
|
77
|
+
email: james@r0bertson.co.uk
|
78
|
+
executables: []
|
79
|
+
extensions: []
|
80
|
+
extra_rdoc_files: []
|
81
|
+
files:
|
82
|
+
- lib/liveblog-indexer.rb
|
83
|
+
homepage: https://github.com/jrobertson/liveblog-indexer
|
84
|
+
licenses:
|
85
|
+
- MIT
|
86
|
+
metadata: {}
|
87
|
+
post_install_message:
|
88
|
+
rdoc_options: []
|
89
|
+
require_paths:
|
90
|
+
- lib
|
91
|
+
required_ruby_version: !ruby/object:Gem::Requirement
|
92
|
+
requirements:
|
93
|
+
- - ">="
|
94
|
+
- !ruby/object:Gem::Version
|
95
|
+
version: '0'
|
96
|
+
required_rubygems_version: !ruby/object:Gem::Requirement
|
97
|
+
requirements:
|
98
|
+
- - ">="
|
99
|
+
- !ruby/object:Gem::Version
|
100
|
+
version: '0'
|
101
|
+
requirements: []
|
102
|
+
rubyforge_project:
|
103
|
+
rubygems_version: 2.4.8
|
104
|
+
signing_key:
|
105
|
+
specification_version: 4
|
106
|
+
summary: This gem is under development. Generates a Liveblog indexed file in JSON
|
107
|
+
format as well as Polyrex format.
|
108
|
+
test_files: []
|
metadata.gz.sig
ADDED
@@ -0,0 +1 @@
|
|
1
|
+
|�U;\�@�M�hN��3��,��lV�0?�\�if*��+Z'5oX�1�Æ�Ԗ���[�g�*�TE`0��aVh�!��C�6�eA�ڒEO-M����Y����2�w�+Q��p��Z��)ɂZV�h2j���b���k�G�CV��\ -������˥���`�����[z&�k���Q�����M�p��<��F�q���U�����ػ��3�O��ۙhJ�������?P&����H�MD��{��/
|