iudex-simhash 1.4.0-java → 1.7.0-java
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +7 -0
- data/History.rdoc +3 -0
- data/Manifest.txt +1 -1
- data/README.rdoc +1 -1
- data/bin/iudex-simhash-perftest +1 -1
- data/lib/iudex-simhash.rb +1 -1
- data/lib/iudex-simhash/base.rb +2 -2
- data/lib/iudex-simhash/factory_helper.rb +1 -1
- data/lib/iudex-simhash/iudex-simhash-1.7.0.jar +0 -0
- data/lib/iudex-simhash/sim_hash_gen_perf_test_factory.rb +1 -1
- data/pom.xml +3 -3
- data/test/setup.rb +1 -1
- data/test/test_fuzzy_set.rb +1 -1
- data/test/test_simhash_generator.rb +1 -1
- metadata +35 -53
- data/lib/iudex-simhash/iudex-simhash-1.4.0.jar +0 -0
checksums.yaml
ADDED
|
@@ -0,0 +1,7 @@
|
|
|
1
|
+
---
|
|
2
|
+
SHA1:
|
|
3
|
+
metadata.gz: 4c591a91f3182a314f6c96d9764a0256eb75c5c2
|
|
4
|
+
data.tar.gz: 30afa0c9a5c4a9e884a8fe16e50aceec6806b4bc
|
|
5
|
+
SHA512:
|
|
6
|
+
metadata.gz: 9c723fa0aca27dd517ecca690417f61c7154e3291411aa6b8b2a0aabb16b7d054caa867efa395a9c5ea3e34325b8a15ca4d9df3898493513232ed2166c904250
|
|
7
|
+
data.tar.gz: 835caf1590e326acace334d39503ec04e4ad0a304bcb536a7ac7f431d75a9ef43f5826508bb503e125088ecdb3ebbbf4ba74a76857c3b11ece37c0f424e147d3
|
data/History.rdoc
CHANGED
data/Manifest.txt
CHANGED
data/README.rdoc
CHANGED
|
@@ -11,7 +11,7 @@ searching over simhash fingerprints
|
|
|
11
11
|
|
|
12
12
|
== License
|
|
13
13
|
|
|
14
|
-
Copyright (c)
|
|
14
|
+
Copyright (c) 2010-2015 David Kellum
|
|
15
15
|
|
|
16
16
|
Licensed under the Apache License, Version 2.0 (the "License"); you
|
|
17
17
|
may not use this file except in compliance with the License. You
|
data/bin/iudex-simhash-perftest
CHANGED
|
@@ -4,7 +4,7 @@
|
|
|
4
4
|
# For 64b add: -XX:+UseCompressedOops
|
|
5
5
|
|
|
6
6
|
#--
|
|
7
|
-
# Copyright (c)
|
|
7
|
+
# Copyright (c) 2010-2015 David Kellum
|
|
8
8
|
#
|
|
9
9
|
# Licensed under the Apache License, Version 2.0 (the "License"); you
|
|
10
10
|
# may not use this file except in compliance with the License. You may
|
data/lib/iudex-simhash.rb
CHANGED
data/lib/iudex-simhash/base.rb
CHANGED
|
@@ -1,5 +1,5 @@
|
|
|
1
1
|
#--
|
|
2
|
-
# Copyright (c)
|
|
2
|
+
# Copyright (c) 2010-2015 David Kellum
|
|
3
3
|
#
|
|
4
4
|
# Licensed under the Apache License, Version 2.0 (the "License"); you
|
|
5
5
|
# may not use this file except in compliance with the License. You may
|
|
@@ -16,6 +16,6 @@
|
|
|
16
16
|
|
|
17
17
|
module Iudex
|
|
18
18
|
module SimHash
|
|
19
|
-
VERSION = '1.4.0'
|
|
19
|
+
VERSION = '1.7.0'
|
|
20
20
|
end
|
|
21
21
|
end
|
|
Binary file
|
data/pom.xml
CHANGED
|
@@ -3,13 +3,13 @@
|
|
|
3
3
|
<groupId>iudex</groupId>
|
|
4
4
|
<artifactId>iudex-simhash</artifactId>
|
|
5
5
|
<packaging>jar</packaging>
|
|
6
|
-
<version>1.4.0</version>
|
|
6
|
+
<version>1.7.0</version>
|
|
7
7
|
<name>Iudex simhash production and searching</name>
|
|
8
8
|
|
|
9
9
|
<parent>
|
|
10
10
|
<groupId>iudex</groupId>
|
|
11
11
|
<artifactId>iudex-parent</artifactId>
|
|
12
|
-
<version>1.
|
|
12
|
+
<version>1.7.0</version>
|
|
13
13
|
<relativePath>..</relativePath>
|
|
14
14
|
</parent>
|
|
15
15
|
|
|
@@ -18,7 +18,7 @@
|
|
|
18
18
|
<dependency>
|
|
19
19
|
<groupId>iudex</groupId>
|
|
20
20
|
<artifactId>iudex-html</artifactId>
|
|
21
|
-
<version>[1.
|
|
21
|
+
<version>[1.7.0,1.999)</version>
|
|
22
22
|
</dependency>
|
|
23
23
|
|
|
24
24
|
<dependency>
|
data/test/setup.rb
CHANGED
data/test/test_fuzzy_set.rb
CHANGED
|
@@ -2,7 +2,7 @@
|
|
|
2
2
|
#.hashdot.profile += jruby-shortlived
|
|
3
3
|
|
|
4
4
|
#--
|
|
5
|
-
# Copyright (c)
|
|
5
|
+
# Copyright (c) 2010-2015 David Kellum
|
|
6
6
|
#
|
|
7
7
|
# Licensed under the Apache License, Version 2.0 (the "License"); you
|
|
8
8
|
# may not use this file except in compliance with the License. You may
|
|
@@ -3,7 +3,7 @@
|
|
|
3
3
|
#.hashdot.profile += jruby-shortlived
|
|
4
4
|
|
|
5
5
|
#--
|
|
6
|
-
# Copyright (c)
|
|
6
|
+
# Copyright (c) 2010-2015 David Kellum
|
|
7
7
|
#
|
|
8
8
|
# Licensed under the Apache License, Version 2.0 (the "License"); you
|
|
9
9
|
# may not use this file except in compliance with the License. You
|
metadata
CHANGED
|
@@ -1,96 +1,85 @@
|
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
|
2
2
|
name: iudex-simhash
|
|
3
3
|
version: !ruby/object:Gem::Version
|
|
4
|
-
|
|
5
|
-
version: 1.4.0
|
|
4
|
+
version: 1.7.0
|
|
6
5
|
platform: java
|
|
7
6
|
authors:
|
|
8
7
|
- David Kellum
|
|
9
8
|
autorequire:
|
|
10
9
|
bindir: bin
|
|
11
10
|
cert_chain: []
|
|
12
|
-
date:
|
|
11
|
+
date: 2015-05-04 00:00:00.000000000 Z
|
|
13
12
|
dependencies:
|
|
14
13
|
- !ruby/object:Gem::Dependency
|
|
15
|
-
name: iudex-core
|
|
16
|
-
version_requirements: !ruby/object:Gem::Requirement
|
|
17
|
-
requirements:
|
|
18
|
-
- - ~>
|
|
19
|
-
- !ruby/object:Gem::Version
|
|
20
|
-
version: 1.4.0
|
|
21
|
-
none: false
|
|
22
14
|
requirement: !ruby/object:Gem::Requirement
|
|
23
15
|
requirements:
|
|
24
16
|
- - ~>
|
|
25
17
|
- !ruby/object:Gem::Version
|
|
26
|
-
version: 1.4.0
|
|
27
|
-
|
|
18
|
+
version: '1.7'
|
|
19
|
+
name: iudex-core
|
|
28
20
|
prerelease: false
|
|
29
21
|
type: :runtime
|
|
30
|
-
- !ruby/object:Gem::Dependency
|
|
31
|
-
name: iudex-html
|
|
32
22
|
version_requirements: !ruby/object:Gem::Requirement
|
|
33
23
|
requirements:
|
|
34
24
|
- - ~>
|
|
35
25
|
- !ruby/object:Gem::Version
|
|
36
|
-
version: 1.
|
|
37
|
-
|
|
26
|
+
version: '1.7'
|
|
27
|
+
- !ruby/object:Gem::Dependency
|
|
38
28
|
requirement: !ruby/object:Gem::Requirement
|
|
39
29
|
requirements:
|
|
40
30
|
- - ~>
|
|
41
31
|
- !ruby/object:Gem::Version
|
|
42
|
-
version: 1.
|
|
43
|
-
|
|
32
|
+
version: '1.7'
|
|
33
|
+
name: iudex-html
|
|
44
34
|
prerelease: false
|
|
45
35
|
type: :runtime
|
|
46
|
-
- !ruby/object:Gem::Dependency
|
|
47
|
-
name: minitest
|
|
48
36
|
version_requirements: !ruby/object:Gem::Requirement
|
|
49
37
|
requirements:
|
|
50
38
|
- - ~>
|
|
51
39
|
- !ruby/object:Gem::Version
|
|
52
|
-
version:
|
|
53
|
-
|
|
40
|
+
version: '1.7'
|
|
41
|
+
- !ruby/object:Gem::Dependency
|
|
54
42
|
requirement: !ruby/object:Gem::Requirement
|
|
55
43
|
requirements:
|
|
56
44
|
- - ~>
|
|
57
45
|
- !ruby/object:Gem::Version
|
|
58
46
|
version: 4.7.4
|
|
59
|
-
|
|
47
|
+
name: minitest
|
|
60
48
|
prerelease: false
|
|
61
49
|
type: :development
|
|
62
|
-
- !ruby/object:Gem::Dependency
|
|
63
|
-
name: rjack-logback
|
|
64
50
|
version_requirements: !ruby/object:Gem::Requirement
|
|
65
51
|
requirements:
|
|
66
52
|
- - ~>
|
|
67
53
|
- !ruby/object:Gem::Version
|
|
68
|
-
version:
|
|
69
|
-
|
|
54
|
+
version: 4.7.4
|
|
55
|
+
- !ruby/object:Gem::Dependency
|
|
70
56
|
requirement: !ruby/object:Gem::Requirement
|
|
71
57
|
requirements:
|
|
72
58
|
- - ~>
|
|
73
59
|
- !ruby/object:Gem::Version
|
|
74
60
|
version: '1.5'
|
|
75
|
-
|
|
61
|
+
name: rjack-logback
|
|
76
62
|
prerelease: false
|
|
77
63
|
type: :development
|
|
78
|
-
- !ruby/object:Gem::Dependency
|
|
79
|
-
name: rjack-tarpit
|
|
80
64
|
version_requirements: !ruby/object:Gem::Requirement
|
|
81
65
|
requirements:
|
|
82
66
|
- - ~>
|
|
83
67
|
- !ruby/object:Gem::Version
|
|
84
|
-
version: '
|
|
85
|
-
|
|
68
|
+
version: '1.5'
|
|
69
|
+
- !ruby/object:Gem::Dependency
|
|
86
70
|
requirement: !ruby/object:Gem::Requirement
|
|
87
71
|
requirements:
|
|
88
72
|
- - ~>
|
|
89
73
|
- !ruby/object:Gem::Version
|
|
90
|
-
version: '2.
|
|
91
|
-
|
|
74
|
+
version: '2.1'
|
|
75
|
+
name: rjack-tarpit
|
|
92
76
|
prerelease: false
|
|
93
77
|
type: :development
|
|
78
|
+
version_requirements: !ruby/object:Gem::Requirement
|
|
79
|
+
requirements:
|
|
80
|
+
- - ~>
|
|
81
|
+
- !ruby/object:Gem::Version
|
|
82
|
+
version: '2.1'
|
|
94
83
|
description: Iudex is a general purpose web crawler and feed processor in ruby/java. The iudex-simhash gem contains support for generation and searching over simhash fingerprints
|
|
95
84
|
email:
|
|
96
85
|
- dek-oss@gravitext.com
|
|
@@ -105,20 +94,22 @@ files:
|
|
|
105
94
|
- Manifest.txt
|
|
106
95
|
- README.rdoc
|
|
107
96
|
- Rakefile
|
|
108
|
-
- pom.xml
|
|
109
97
|
- bin/iudex-simhash-perftest
|
|
110
98
|
- config/stopwords.en
|
|
111
|
-
- lib/iudex-simhash/base.rb
|
|
112
99
|
- lib/iudex-simhash.rb
|
|
100
|
+
- lib/iudex-simhash/base.rb
|
|
113
101
|
- lib/iudex-simhash/factory_helper.rb
|
|
102
|
+
- lib/iudex-simhash/iudex-simhash-1.7.0.jar
|
|
114
103
|
- lib/iudex-simhash/sim_hash_gen_perf_test_factory.rb
|
|
104
|
+
- pom.xml
|
|
105
|
+
- test/html/gentest.html
|
|
115
106
|
- test/setup.rb
|
|
116
107
|
- test/test_fuzzy_set.rb
|
|
117
108
|
- test/test_simhash_generator.rb
|
|
118
|
-
- test/html/gentest.html
|
|
119
|
-
- lib/iudex-simhash/iudex-simhash-1.4.0.jar
|
|
120
109
|
homepage: http://iudex.gravitext.com
|
|
121
|
-
licenses:
|
|
110
|
+
licenses:
|
|
111
|
+
- Apache-2.0
|
|
112
|
+
metadata: {}
|
|
122
113
|
post_install_message:
|
|
123
114
|
rdoc_options:
|
|
124
115
|
- --main
|
|
@@ -127,27 +118,18 @@ require_paths:
|
|
|
127
118
|
- lib
|
|
128
119
|
required_ruby_version: !ruby/object:Gem::Requirement
|
|
129
120
|
requirements:
|
|
130
|
-
- -
|
|
121
|
+
- - '>='
|
|
131
122
|
- !ruby/object:Gem::Version
|
|
132
|
-
version:
|
|
133
|
-
segments:
|
|
134
|
-
- 0
|
|
135
|
-
hash: 2
|
|
136
|
-
none: false
|
|
123
|
+
version: 1.8.7
|
|
137
124
|
required_rubygems_version: !ruby/object:Gem::Requirement
|
|
138
125
|
requirements:
|
|
139
|
-
- -
|
|
126
|
+
- - '>='
|
|
140
127
|
- !ruby/object:Gem::Version
|
|
141
128
|
version: '0'
|
|
142
|
-
segments:
|
|
143
|
-
- 0
|
|
144
|
-
hash: 2
|
|
145
|
-
none: false
|
|
146
129
|
requirements: []
|
|
147
130
|
rubyforge_project:
|
|
148
|
-
rubygems_version:
|
|
131
|
+
rubygems_version: 2.4.5
|
|
149
132
|
signing_key:
|
|
150
|
-
specification_version:
|
|
133
|
+
specification_version: 4
|
|
151
134
|
summary: Iudex is a general purpose web crawler and feed processor in ruby/java.
|
|
152
135
|
test_files: []
|
|
153
|
-
...
|
|
Binary file
|