tokenizer 0.0.1.prealpha

This diff shows the content of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.
data/LICENSE ADDED
File without changes
data/README.rdoc ADDED
File without changes
data/Rakefile ADDED
@@ -0,0 +1,37 @@
1
+ begin  # load rake directly when it is already on the load path
2
+ require 'rake'
3
+ rescue LoadError  # rake was not found: load RubyGems first, then try again
4
+ require 'rubygems'
5
+ require 'rake'
6
+ end
7
+
8
+ # rake/clean adds the 'clean' and 'clobber' tasks and the CLOBBER file list used below
9
+ require 'rake/clean'
10
+
11
+
12
+
13
+ SRC = FileList['**/*.rb']  # all .rb files at any depth below the working directory; not referenced elsewhere in this Rakefile
14
+
15
+ CLOBBER.include('doc', '**/*.html', '**/*.gem')  # 'rake clobber' also removes the doc entry, HTML files and built .gem files
16
+
17
+ # testing: register a test task that runs every Ruby file found under test/
18
+ require 'rake/testtask'
19
+ Rake::TestTask.new do |t|
20
+ t.test_files = FileList.new('test/**/*.rb').to_a  # glob expanded once, when the Rakefile is loaded
21
+ end
22
+
23
+ # Build the gem package from the specification in tokenizer.gemspec
24
+ load 'tokenizer.gemspec'  # presumably defines the GEMSPEC constant used below - confirm in the gemspec
25
+ require 'rubygems/package_task'
26
+ Gem::PackageTask.new(GEMSPEC).define  # no block is passed, so the packaging tasks are defined explicitly
27
+
28
+ # Generate documentation
29
+ require 'rdoc/task'
30
+ RDoc::Task.new do |rdoc|
31
+ rdoc.rdoc_files.include('README', 'LICENSE', 'lib/**/*')
32
+ end
33
+
34
+ desc "Open an irb session preloaded with this library."
35
+ task :console do
36
+ sh "irb -rubygems -I lib -r tokenizer.rb"
37
+ end
data/bin/tokenize ADDED
@@ -0,0 +1,8 @@
1
+ #!/usr/bin/ruby -nw
2
+
3
+ BEGIN {  # runs once, before the implicit read loop enabled by -n in the shebang
4
+ $/ = " "  # input record separator: each read returns text up to and including the next space
5
+ }
6
+
7
+ puts $_  # loop body under -n: write the record just read (separator not stripped) to stdout
8
+
data/lib/tokenizer/version.rb ADDED
@@ -0,0 +1,3 @@
1
+ module Tokenizer  # namespace module; in this file it only carries the version constant
2
+ VERSION = '0.0.1.prealpha'  # version string of this release
3
+ end
data/test/test_tokenizer.rb ADDED
File without changes
metadata ADDED
@@ -0,0 +1,76 @@
1
+ --- !ruby/object:Gem::Specification
2
+ name: tokenizer
3
+ version: !ruby/object:Gem::Version
4
+ hash: 196621262
5
+ prerelease: 6
6
+ segments:
7
+ - 0
8
+ - 0
9
+ - 1
10
+ - prealpha
11
+ version: 0.0.1.prealpha
12
+ platform: ruby
13
+ authors:
14
+ - Andrei Beliankou
15
+ autorequire:
16
+ bindir: bin
17
+ cert_chain: []
18
+
19
+ date: 2011-05-05 00:00:00 Z
20
+ dependencies: []
21
+
22
+ description: A simple tokenizer for NLP tasks.
23
+ email: a.belenkow@uni-trier.de
24
+ executables:
25
+ - tokenize
26
+ extensions: []
27
+
28
+ extra_rdoc_files:
29
+ - README.rdoc
30
+ - LICENSE
31
+ files:
32
+ - lib/tokenizer/version.rb
33
+ - bin/tokenize
34
+ - README.rdoc
35
+ - LICENSE
36
+ - Rakefile
37
+ - test/test_tokenizer.rb
38
+ homepage: http://www.uni-trier.de/index.php?id=34451
39
+ licenses: []
40
+
41
+ post_install_message:
42
+ rdoc_options:
43
+ - -m
44
+ - README.rdoc
45
+ require_paths:
46
+ - lib
47
+ required_ruby_version: !ruby/object:Gem::Requirement
48
+ none: false
49
+ requirements:
50
+ - - ">="
51
+ - !ruby/object:Gem::Version
52
+ hash: 31
53
+ segments:
54
+ - 1
55
+ - 8
56
+ version: "1.8"
57
+ required_rubygems_version: !ruby/object:Gem::Requirement
58
+ none: false
59
+ requirements:
60
+ - - ">"
61
+ - !ruby/object:Gem::Version
62
+ hash: 25
63
+ segments:
64
+ - 1
65
+ - 3
66
+ - 1
67
+ version: 1.3.1
68
+ requirements: []
69
+
70
+ rubyforge_project: tokenizer
71
+ rubygems_version: 1.7.2
72
+ signing_key:
73
+ specification_version: 3
74
+ summary: Tokenizer is a linguistic tool intended to split a text into tokens.
75
+ test_files:
76
+ - test/test_tokenizer.rb