iudex-simhash 1.1.0-java → 1.2.b.0-java
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- data/History.rdoc +3 -0
- data/Manifest.txt +1 -1
- data/README.rdoc +1 -1
- data/Rakefile +2 -34
- data/bin/iudex-simhash-perftest +1 -1
- data/lib/iudex-simhash.rb +1 -1
- data/lib/iudex-simhash/base.rb +2 -2
- data/lib/iudex-simhash/factory_helper.rb +1 -1
- data/lib/iudex-simhash/{iudex-simhash-1.1.0.jar → iudex-simhash-1.2.b.0.jar} +0 -0
- data/lib/iudex-simhash/sim_hash_gen_perf_test_factory.rb +1 -1
- data/pom.xml +3 -3
- data/test/setup.rb +17 -14
- data/test/test_fuzzy_set.rb +1 -1
- data/test/test_simhash_generator.rb +1 -1
- metadata +40 -32
- data/.gemtest +0 -0
data/History.rdoc
CHANGED
data/Manifest.txt
CHANGED
data/README.rdoc
CHANGED
data/Rakefile
CHANGED
|
@@ -1,39 +1,7 @@
|
|
|
1
1
|
# -*- ruby -*-
|
|
2
2
|
|
|
3
|
-
$LOAD_PATH << './lib'
|
|
4
|
-
require 'iudex-simhash/base'
|
|
5
|
-
|
|
6
3
|
require 'rubygems'
|
|
7
|
-
|
|
4
|
+
require 'bundler/setup'
|
|
8
5
|
require 'rjack-tarpit'
|
|
9
6
|
|
|
10
|
-
|
|
11
|
-
Iudex::SimHash::VERSION,
|
|
12
|
-
:no_assembly, :java_platform )
|
|
13
|
-
|
|
14
|
-
t.specify do |h|
|
|
15
|
-
h.developer( "David Kellum", "dek-oss@gravitext.com" )
|
|
16
|
-
h.extra_deps += [ [ 'iudex-html', '~> 1.1.0' ] ]
|
|
17
|
-
|
|
18
|
-
h.testlib = :minitest
|
|
19
|
-
h.extra_dev_deps += [ [ 'minitest', '~> 2.3' ],
|
|
20
|
-
[ 'rjack-logback', '~> 1.0' ] ]
|
|
21
|
-
end
|
|
22
|
-
|
|
23
|
-
file 'Manifest.txt' => [ 'pom.xml' ]
|
|
24
|
-
|
|
25
|
-
task :check_pom_version do
|
|
26
|
-
t.test_line_match( 'pom.xml', /<version>/, /#{t.version}/ )
|
|
27
|
-
end
|
|
28
|
-
task :check_history_version do
|
|
29
|
-
t.test_line_match( 'History.rdoc', /^==/, / #{t.version} / )
|
|
30
|
-
end
|
|
31
|
-
task :check_history_date do
|
|
32
|
-
t.test_line_match( 'History.rdoc', /^==/, /\([0-9\-]+\)$/ )
|
|
33
|
-
end
|
|
34
|
-
|
|
35
|
-
task :gem => [ :check_pom_version, :check_history_version ]
|
|
36
|
-
task :tag => [ :check_pom_version, :check_history_version, :check_history_date ]
|
|
37
|
-
task :push => [ :check_history_date ]
|
|
38
|
-
|
|
39
|
-
t.define_tasks
|
|
7
|
+
RJack::TarPit.new( 'iudex-simhash' ).define_tasks
|
data/bin/iudex-simhash-perftest
CHANGED
|
@@ -4,7 +4,7 @@
|
|
|
4
4
|
# For 64b add: -XX:+UseCompressedOops
|
|
5
5
|
|
|
6
6
|
#--
|
|
7
|
-
# Copyright (c)
|
|
7
|
+
# Copyright (c) 2008-2012 David Kellum
|
|
8
8
|
#
|
|
9
9
|
# Licensed under the Apache License, Version 2.0 (the "License"); you
|
|
10
10
|
# may not use this file except in compliance with the License. You may
|
data/lib/iudex-simhash.rb
CHANGED
data/lib/iudex-simhash/base.rb
CHANGED
|
@@ -1,5 +1,5 @@
|
|
|
1
1
|
#--
|
|
2
|
-
# Copyright (c)
|
|
2
|
+
# Copyright (c) 2008-2012 David Kellum
|
|
3
3
|
#
|
|
4
4
|
# Licensed under the Apache License, Version 2.0 (the "License"); you
|
|
5
5
|
# may not use this file except in compliance with the License. You may
|
|
@@ -16,6 +16,6 @@
|
|
|
16
16
|
|
|
17
17
|
module Iudex
|
|
18
18
|
module SimHash
|
|
19
|
-
VERSION = '1.1.0'
|
|
19
|
+
VERSION = '1.2.b.0'
|
|
20
20
|
end
|
|
21
21
|
end
|
|
Binary file
|
data/pom.xml
CHANGED
|
@@ -3,13 +3,13 @@
|
|
|
3
3
|
<groupId>iudex</groupId>
|
|
4
4
|
<artifactId>iudex-simhash</artifactId>
|
|
5
5
|
<packaging>jar</packaging>
|
|
6
|
-
<version>1.1.0</version>
|
|
6
|
+
<version>1.2.b.0</version>
|
|
7
7
|
<name>Iudex simhash production and searching</name>
|
|
8
8
|
|
|
9
9
|
<parent>
|
|
10
10
|
<groupId>iudex</groupId>
|
|
11
11
|
<artifactId>iudex-parent</artifactId>
|
|
12
|
-
<version>1.
|
|
12
|
+
<version>1.2.b.0</version>
|
|
13
13
|
<relativePath>..</relativePath>
|
|
14
14
|
</parent>
|
|
15
15
|
|
|
@@ -18,7 +18,7 @@
|
|
|
18
18
|
<dependency>
|
|
19
19
|
<groupId>iudex</groupId>
|
|
20
20
|
<artifactId>iudex-html</artifactId>
|
|
21
|
-
<version>[1.
|
|
21
|
+
<version>[1.2,1.2.9999)</version>
|
|
22
22
|
</dependency>
|
|
23
23
|
|
|
24
24
|
<dependency>
|
data/test/setup.rb
CHANGED
|
@@ -1,5 +1,5 @@
|
|
|
1
1
|
#--
|
|
2
|
-
# Copyright (c)
|
|
2
|
+
# Copyright (c) 2008-2012 David Kellum
|
|
3
3
|
#
|
|
4
4
|
# Licensed under the Apache License, Version 2.0 (the "License"); you
|
|
5
5
|
# may not use this file except in compliance with the License. You
|
|
@@ -14,22 +14,25 @@
|
|
|
14
14
|
# permissions and limitations under the License.
|
|
15
15
|
#++
|
|
16
16
|
|
|
17
|
-
#### General test setup
|
|
18
|
-
|
|
19
|
-
ldir = File.join( File.dirname( __FILE__ ), "..", "lib" )
|
|
20
|
-
$LOAD_PATH.unshift( ldir ) unless $LOAD_PATH.include?( ldir )
|
|
17
|
+
#### General test setup, logging, console output ####
|
|
21
18
|
|
|
22
19
|
require 'rubygems'
|
|
23
|
-
|
|
24
|
-
require 'rjack-logback'
|
|
25
|
-
RJack::Logback.config_console( :stderr => true )
|
|
20
|
+
require 'bundler/setup'
|
|
26
21
|
|
|
27
22
|
require 'minitest/unit'
|
|
28
23
|
require 'minitest/autorun'
|
|
29
24
|
|
|
30
|
-
|
|
31
|
-
|
|
32
|
-
|
|
33
|
-
|
|
34
|
-
|
|
35
|
-
|
|
25
|
+
require 'rjack-logback'
|
|
26
|
+
|
|
27
|
+
module TestSetup
|
|
28
|
+
include RJack
|
|
29
|
+
Logback.config_console( :stderr => true, :thread => true )
|
|
30
|
+
|
|
31
|
+
if ( ARGV & %w[ -v --verbose --debug ] ).empty?
|
|
32
|
+
Logback.root.level = Logback::INFO
|
|
33
|
+
else
|
|
34
|
+
Logback.root.level = Logback::DEBUG
|
|
35
|
+
end
|
|
36
|
+
|
|
37
|
+
ARGV.delete( '--debug' )
|
|
38
|
+
end
|
data/test/test_fuzzy_set.rb
CHANGED
|
@@ -2,7 +2,7 @@
|
|
|
2
2
|
#.hashdot.profile += jruby-shortlived
|
|
3
3
|
|
|
4
4
|
#--
|
|
5
|
-
# Copyright (c)
|
|
5
|
+
# Copyright (c) 2008-2012 David Kellum
|
|
6
6
|
#
|
|
7
7
|
# Licensed under the Apache License, Version 2.0 (the "License"); you
|
|
8
8
|
# may not use this file except in compliance with the License. You may
|
|
@@ -3,7 +3,7 @@
|
|
|
3
3
|
#.hashdot.profile += jruby-shortlived
|
|
4
4
|
|
|
5
5
|
#--
|
|
6
|
-
# Copyright (c)
|
|
6
|
+
# Copyright (c) 2008-2012 David Kellum
|
|
7
7
|
#
|
|
8
8
|
# Licensed under the Apache License, Version 2.0 (the "License"); you
|
|
9
9
|
# may not use this file except in compliance with the License. You
|
metadata
CHANGED
|
@@ -1,8 +1,8 @@
|
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
|
2
2
|
name: iudex-simhash
|
|
3
3
|
version: !ruby/object:Gem::Version
|
|
4
|
-
prerelease:
|
|
5
|
-
version: 1.1.0
|
|
4
|
+
prerelease: 4
|
|
5
|
+
version: 1.2.b.0
|
|
6
6
|
platform: java
|
|
7
7
|
authors:
|
|
8
8
|
- David Kellum
|
|
@@ -10,56 +10,64 @@ autorequire:
|
|
|
10
10
|
bindir: bin
|
|
11
11
|
cert_chain: []
|
|
12
12
|
|
|
13
|
-
date:
|
|
13
|
+
date: 2012-03-05 00:00:00 Z
|
|
14
14
|
dependencies:
|
|
15
15
|
- !ruby/object:Gem::Dependency
|
|
16
|
-
name: iudex-html
|
|
16
|
+
name: iudex-core
|
|
17
|
+
version_requirements: &id001 !ruby/object:Gem::Requirement
|
|
18
|
+
none: false
|
|
19
|
+
requirements:
|
|
20
|
+
- - ~>
|
|
21
|
+
- !ruby/object:Gem::Version
|
|
22
|
+
version: 1.2.b
|
|
23
|
+
requirement: *id001
|
|
17
24
|
prerelease: false
|
|
18
|
-
|
|
25
|
+
type: :runtime
|
|
26
|
+
- !ruby/object:Gem::Dependency
|
|
27
|
+
name: iudex-html
|
|
28
|
+
version_requirements: &id002 !ruby/object:Gem::Requirement
|
|
19
29
|
none: false
|
|
20
30
|
requirements:
|
|
21
31
|
- - ~>
|
|
22
32
|
- !ruby/object:Gem::Version
|
|
23
|
-
version: 1.1.0
|
|
33
|
+
version: 1.2.b
|
|
34
|
+
requirement: *id002
|
|
35
|
+
prerelease: false
|
|
24
36
|
type: :runtime
|
|
25
|
-
version_requirements: *id001
|
|
26
37
|
- !ruby/object:Gem::Dependency
|
|
27
38
|
name: minitest
|
|
28
|
-
|
|
29
|
-
requirement: &id002 !ruby/object:Gem::Requirement
|
|
39
|
+
version_requirements: &id003 !ruby/object:Gem::Requirement
|
|
30
40
|
none: false
|
|
31
41
|
requirements:
|
|
32
42
|
- - ~>
|
|
33
43
|
- !ruby/object:Gem::Version
|
|
34
44
|
version: "2.3"
|
|
45
|
+
requirement: *id003
|
|
46
|
+
prerelease: false
|
|
35
47
|
type: :development
|
|
36
|
-
version_requirements: *id002
|
|
37
48
|
- !ruby/object:Gem::Dependency
|
|
38
49
|
name: rjack-logback
|
|
39
|
-
|
|
40
|
-
requirement: &id003 !ruby/object:Gem::Requirement
|
|
50
|
+
version_requirements: &id004 !ruby/object:Gem::Requirement
|
|
41
51
|
none: false
|
|
42
52
|
requirements:
|
|
43
53
|
- - ~>
|
|
44
54
|
- !ruby/object:Gem::Version
|
|
45
55
|
version: "1.0"
|
|
56
|
+
requirement: *id004
|
|
57
|
+
prerelease: false
|
|
46
58
|
type: :development
|
|
47
|
-
version_requirements: *id003
|
|
48
59
|
- !ruby/object:Gem::Dependency
|
|
49
60
|
name: rjack-tarpit
|
|
50
|
-
|
|
51
|
-
requirement: &id004 !ruby/object:Gem::Requirement
|
|
61
|
+
version_requirements: &id005 !ruby/object:Gem::Requirement
|
|
52
62
|
none: false
|
|
53
63
|
requirements:
|
|
54
64
|
- - ~>
|
|
55
65
|
- !ruby/object:Gem::Version
|
|
56
|
-
version:
|
|
66
|
+
version: "2.0"
|
|
67
|
+
requirement: *id005
|
|
68
|
+
prerelease: false
|
|
57
69
|
type: :development
|
|
58
|
-
|
|
59
|
-
description: |-
|
|
60
|
-
Iudex is a general purpose web crawler and feed processor in
|
|
61
|
-
ruby/java. The iudex-simhash gem contains support for generation and
|
|
62
|
-
searching over simhash fingerprints
|
|
70
|
+
description: Iudex is a general purpose web crawler and feed processor in ruby/java. The iudex-simhash gem contains support for generation and searching over simhash fingerprints
|
|
63
71
|
email:
|
|
64
72
|
- dek-oss@gravitext.com
|
|
65
73
|
executables:
|
|
@@ -67,7 +75,6 @@ executables:
|
|
|
67
75
|
extensions: []
|
|
68
76
|
|
|
69
77
|
extra_rdoc_files:
|
|
70
|
-
- Manifest.txt
|
|
71
78
|
- History.rdoc
|
|
72
79
|
- README.rdoc
|
|
73
80
|
files:
|
|
@@ -86,8 +93,7 @@ files:
|
|
|
86
93
|
- test/test_fuzzy_set.rb
|
|
87
94
|
- test/test_simhash_generator.rb
|
|
88
95
|
- test/html/gentest.html
|
|
89
|
-
- lib/iudex-simhash/iudex-simhash-1.1.0.jar
|
|
90
|
-
- .gemtest
|
|
96
|
+
- lib/iudex-simhash/iudex-simhash-1.2.b.0.jar
|
|
91
97
|
homepage: http://github.com/dekellum/iudex
|
|
92
98
|
licenses: []
|
|
93
99
|
|
|
@@ -102,20 +108,22 @@ required_ruby_version: !ruby/object:Gem::Requirement
|
|
|
102
108
|
requirements:
|
|
103
109
|
- - ">="
|
|
104
110
|
- !ruby/object:Gem::Version
|
|
111
|
+
hash: 2
|
|
112
|
+
segments:
|
|
113
|
+
- 0
|
|
105
114
|
version: "0"
|
|
106
115
|
required_rubygems_version: !ruby/object:Gem::Requirement
|
|
107
116
|
none: false
|
|
108
117
|
requirements:
|
|
109
|
-
- - "
|
|
118
|
+
- - ">"
|
|
110
119
|
- !ruby/object:Gem::Version
|
|
111
|
-
version:
|
|
120
|
+
version: 1.3.1
|
|
112
121
|
requirements: []
|
|
113
122
|
|
|
114
|
-
rubyforge_project:
|
|
115
|
-
rubygems_version: 1.8.
|
|
123
|
+
rubyforge_project:
|
|
124
|
+
rubygems_version: 1.8.15
|
|
116
125
|
signing_key:
|
|
117
126
|
specification_version: 3
|
|
118
|
-
summary: Iudex is a general purpose web crawler and feed processor in ruby/java
|
|
119
|
-
test_files:
|
|
120
|
-
|
|
121
|
-
- test/test_simhash_generator.rb
|
|
127
|
+
summary: Iudex is a general purpose web crawler and feed processor in ruby/java.
|
|
128
|
+
test_files: []
|
|
129
|
+
|
data/.gemtest
DELETED
|
File without changes
|