opener-tree-tagger 4.1.0 → 4.1.1
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/README.md +1 -3
- data/core/token_matcher.pyc +0 -0
- data/lib/opener/tree_tagger/version.rb +1 -1
- data/task/compile.rake +1 -1
- data/task/requirements.rake +1 -1
- data/task/test.rake +2 -0
- data/task/tree_tagger.rake +104 -0
- metadata +3 -3
- data/core/token_matcher.pyo +0 -0
checksums.yaml
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
---
|
2
2
|
SHA1:
|
3
|
-
metadata.gz:
|
4
|
-
data.tar.gz:
|
3
|
+
metadata.gz: 9aca59531b99c79ccd0c90b96cd29b97dbf5bafb
|
4
|
+
data.tar.gz: 0003f755f745bdcfe7b07b32cd73956f2ebccd4a
|
5
5
|
SHA512:
|
6
|
-
metadata.gz:
|
7
|
-
data.tar.gz:
|
6
|
+
metadata.gz: d82e488f8b2762298ab4be2f2ab856ee129c61cb666fa48297a44445024c0e78edcbf0a237625219451d695ec2a1843456922b500f2ccdc5798b7f1bd135eaf8
|
7
|
+
data.tar.gz: 957524f329e7ea0848787b8629f8728eab0102b3b9920a8cfa9abd4f2aa954c79c72e4462d3bc79d374e0b4b2cd5df4cc2d9a0aa8d87ba8dec31d6479307d05e
|
data/README.md
CHANGED
@@ -1,5 +1,3 @@
|
|
1
|
-
[](https://drone.io/github.com/opener-project/VU-tree-tagger_kernel/latest)
|
2
|
-
|
3
1
|
Introduction
|
4
2
|
------------
|
5
3
|
|
@@ -152,4 +150,4 @@ Contributing
|
|
152
150
|
2. Create your feature branch (`git checkout -b my-new-feature`)
|
153
151
|
3. Commit your changes (`git commit -am 'Add some feature'`)
|
154
152
|
4. Push to the branch (`git push origin my-new-feature`)
|
155
|
-
5. Create new Pull Request
|
153
|
+
5. Create new Pull Request
|
data/core/token_matcher.pyc
CHANGED
Binary file
|
data/task/compile.rake
CHANGED
@@ -1,2 +1,2 @@
|
|
1
1
|
desc 'Verifies requirements and compiles the core'
|
2
|
-
task :compile => ['requirements', 'python:compile']
|
2
|
+
task :compile => ['requirements', 'python:compile', 'tree_tagger']
|
data/task/requirements.rake
CHANGED
data/task/test.rake
CHANGED
|
data/task/tree_tagger.rake
ADDED
@@ -0,0 +1,104 @@
|
|
1
|
+
# This Rake task takes care of setting up a local (in ./tmp) installation of the
|
2
|
+
# TreeTagger program used by this OpeNER component. Sadly TreeTagger is a total
|
3
|
+
# pain to install and not shipped with Debian and other distributions. Yay
|
4
|
+
# software!
|
5
|
+
#
|
6
|
+
# Once installed you can set your TREE_TAGGER_PATH as following:
|
7
|
+
#
|
8
|
+
# export TREE_TAGGER_PATH=./tmp/tree_tagger
|
9
|
+
|
10
|
+
# The name of the TreeTagger archive to download. Currently only Linux and OS X
|
11
|
+
# are supported.
|
12
|
+
if RbConfig::CONFIG['build_os'].include?('darwin')
|
13
|
+
archive = 'tree-tagger-MacOSX-3.2-intel.tar.gz'
|
14
|
+
else
|
15
|
+
archive = 'tree-tagger-linux-3.2.tar.gz'
|
16
|
+
end
|
17
|
+
|
18
|
+
tagging_archive = 'tagger-scripts.tar.gz'
|
19
|
+
installer = 'install-tagger.sh'
|
20
|
+
|
21
|
+
parameter_tasks = []
|
22
|
+
parameter_files = [
|
23
|
+
'dutch-par-linux-3.2-utf8.bin.gz',
|
24
|
+
'english-par-linux-3.2-utf8.bin.gz',
|
25
|
+
'french-par-linux-3.2-utf8.bin.gz',
|
26
|
+
'german-par-linux-3.2-utf8.bin.gz',
|
27
|
+
'italian-par-linux-3.2-utf8.bin.gz',
|
28
|
+
'spanish-par-linux-3.2-utf8.bin.gz',
|
29
|
+
'english-chunker-par-linux-3.2-utf8.bin.gz',
|
30
|
+
'french-chunker-par-linux-3.2-utf8.bin.gz',
|
31
|
+
'german-chunker-par-linux-3.2-utf8.bin.gz'
|
32
|
+
]
|
33
|
+
|
34
|
+
base_url = 'http://www.cis.uni-muenchen.de/~schmid/tools/TreeTagger/data/'
|
35
|
+
archive_url = base_url + archive
|
36
|
+
tagging_url = base_url + tagging_archive
|
37
|
+
installer_url = base_url + installer
|
38
|
+
|
39
|
+
tmp_target = 'tmp/tree_tagger'
|
40
|
+
tmp_executable = File.join(tmp_target, 'bin/tree-tagger')
|
41
|
+
tmp_archive = File.join(tmp_target, archive)
|
42
|
+
tmp_tagging_archive = File.join(tmp_target, tagging_archive)
|
43
|
+
tmp_installer = File.join(tmp_target, installer)
|
44
|
+
|
45
|
+
# Downloads the base TreeTagger code
|
46
|
+
file(tmp_archive) do |task|
|
47
|
+
sh "wget #{archive_url} -O #{task.name} --quiet"
|
48
|
+
end
|
49
|
+
|
50
|
+
# Downloads the tagging scripts.
|
51
|
+
file(tmp_tagging_archive) do |task|
|
52
|
+
sh "wget #{tagging_url} -O #{task.name} --quiet"
|
53
|
+
end
|
54
|
+
|
55
|
+
# Downloads the installer script.
|
56
|
+
file(tmp_installer) do |task|
|
57
|
+
sh "wget #{installer_url} -O #{task.name} --quiet"
|
58
|
+
end
|
59
|
+
|
60
|
+
directory(tmp_target) do |task|
|
61
|
+
sh "mkdir -p #{task.name}"
|
62
|
+
end
|
63
|
+
|
64
|
+
parameter_files.each do |name|
|
65
|
+
task_name = File.join(tmp_target, name)
|
66
|
+
input_url = base_url + name
|
67
|
+
|
68
|
+
parameter_tasks << task_name
|
69
|
+
|
70
|
+
file(task_name) do |task|
|
71
|
+
sh "wget #{input_url} -O #{task.name} --quiet"
|
72
|
+
end
|
73
|
+
end
|
74
|
+
|
75
|
+
file(tmp_executable) do |task|
|
76
|
+
# Downloaded half the internet, lets actually install TreeTagger.
|
77
|
+
Dir.chdir(tmp_target) do
|
78
|
+
sh "bash #{installer}"
|
79
|
+
|
80
|
+
# TreeTagger at some point dropped the "-utf8" suffix from tagging scripts
|
81
|
+
# located in cmd/, this however only applies to newer versions of the
|
82
|
+
# tagging scripts. To support both we'll simply symlink these files.
|
83
|
+
#
|
84
|
+
# In case you're wondering: no, TreeTagger doesn't version the tagging
|
85
|
+
# scripts, as such this could break again at any point in time.
|
86
|
+
Dir['cmd/tree-tagger-*'].each do |cmd_file|
|
87
|
+
cmd_file = File.expand_path(cmd_file)
|
88
|
+
suffixed = cmd_file + '-utf8'
|
89
|
+
|
90
|
+
sh "ln -s #{cmd_file} #{suffixed}"
|
91
|
+
sh "chmod +x #{suffixed}"
|
92
|
+
end
|
93
|
+
end
|
94
|
+
end
|
95
|
+
|
96
|
+
build_requirements = [
|
97
|
+
tmp_target,
|
98
|
+
tmp_archive,
|
99
|
+
tmp_tagging_archive,
|
100
|
+
tmp_installer
|
101
|
+
] + parameter_tasks + [tmp_executable]
|
102
|
+
|
103
|
+
desc 'Installs a local copy of TreeTagger'
|
104
|
+
task :tree_tagger => build_requirements
|
metadata
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
2
2
|
name: opener-tree-tagger
|
3
3
|
version: !ruby/object:Gem::Version
|
4
|
-
version: 4.1.0
|
4
|
+
version: 4.1.1
|
5
5
|
platform: ruby
|
6
6
|
authors:
|
7
7
|
- rubenIzquierdo
|
@@ -9,7 +9,7 @@ authors:
|
|
9
9
|
autorequire:
|
10
10
|
bindir: bin
|
11
11
|
cert_chain: []
|
12
|
-
date:
|
12
|
+
date: 2015-01-12 00:00:00.000000000 Z
|
13
13
|
dependencies:
|
14
14
|
- !ruby/object:Gem::Dependency
|
15
15
|
name: opener-daemons
|
@@ -163,7 +163,6 @@ files:
|
|
163
163
|
- core/spanish.map.treetagger.kaf.csv
|
164
164
|
- core/token_matcher.py
|
165
165
|
- core/token_matcher.pyc
|
166
|
-
- core/token_matcher.pyo
|
167
166
|
- core/tt_from_kaf_to_kaf.py
|
168
167
|
- exec/tree-tagger.rb
|
169
168
|
- ext/hack/Rakefile
|
@@ -180,6 +179,7 @@ files:
|
|
180
179
|
- task/python.rake
|
181
180
|
- task/requirements.rake
|
182
181
|
- task/test.rake
|
182
|
+
- task/tree_tagger.rake
|
183
183
|
homepage: http://opener-project.github.com/
|
184
184
|
licenses:
|
185
185
|
- Apache 2.0
|
data/core/token_matcher.pyo
DELETED
Binary file
|