tokenizer 0.0.1.prealpha

Sign up to get free protection for your applications and to get access to all the features.
data/LICENSE ADDED
File without changes
data/README.rdoc ADDED
File without changes
data/Rakefile ADDED
@@ -0,0 +1,37 @@
# Rakefile for the tokenizer gem: defines the cleanup, test, packaging,
# documentation and console tasks.

# Fall back to loading RubyGems first when rake cannot be required directly.
begin
  require 'rake'
rescue LoadError
  require 'rubygems'
  require 'rake'
end

# rake/clean adds the 'clobber' and 'clean' tasks and the CLOBBER file list.
require 'rake/clean'

# Every Ruby source file below the project root.
SRC = FileList['**/*.rb']

# Generated artefacts that `rake clobber` removes.
CLOBBER.include('doc', '**/*.html', '**/*.gem')

# Testing: every Ruby file below test/ is treated as a test file.
require 'rake/testtask'
Rake::TestTask.new do |t|
  t.test_files = FileList.new('test/**/*.rb').to_a
end

# Build the gem package. tokenizer.gemspec is expected to define GEMSPEC.
load 'tokenizer.gemspec'
require 'rubygems/package_task'
Gem::PackageTask.new(GEMSPEC).define

# Generate documentation.
require 'rdoc/task'
RDoc::Task.new do |rdoc|
  # The README ships as README.rdoc; a bare 'README' pattern matches no file,
  # so the README would silently be left out of the generated docs.
  rdoc.main = 'README.rdoc'
  rdoc.rdoc_files.include('README.rdoc', 'LICENSE', 'lib/**/*')
end

desc "Open an irb session preloaded with this library."
task :console do
  # `-rubygems` is really `-r ubygems` and depends on the ubygems.rb shim,
  # which newer Ruby releases no longer ship; `-r rubygems` works on old and
  # new interpreters alike.
  sh "irb -r rubygems -I lib -r tokenizer.rb"
end
data/bin/tokenize ADDED
@@ -0,0 +1,8 @@
#!/usr/bin/env ruby
# Splits the input on single spaces and prints each chunk on its own line.
# Input is read through ARGF: the files named on the command line, or
# standard input when no file is given.

# Equivalent of the former `-w` interpreter switch; `env` cannot portably
# forward switches from the shebang line, so warnings are enabled here.
$VERBOSE = true

# Each chunk keeps its trailing space separator, exactly as the former
# `-n` loop with `$/ = " "` delivered it in `$_`. Passing the separator
# explicitly avoids mutating the global `$/` inside a BEGIN block.
ARGF.each_line(' ') { |chunk| puts chunk }
data/lib/tokenizer/version.rb ADDED
@@ -0,0 +1,3 @@
# Namespace of the tokenizer library.
module Tokenizer
  # Version string of this release. Frozen so that the shared constant
  # cannot be mutated in place at runtime.
  VERSION = '0.0.1.prealpha'.freeze
end
File without changes
metadata ADDED
@@ -0,0 +1,76 @@
1
+ --- !ruby/object:Gem::Specification
2
+ name: tokenizer
3
+ version: !ruby/object:Gem::Version
4
+ hash: 196621262
5
+ prerelease: 6
6
+ segments:
7
+ - 0
8
+ - 0
9
+ - 1
10
+ - prealpha
11
+ version: 0.0.1.prealpha
12
+ platform: ruby
13
+ authors:
14
+ - Andrei Beliankou
15
+ autorequire:
16
+ bindir: bin
17
+ cert_chain: []
18
+
19
+ date: 2011-05-05 00:00:00 Z
20
+ dependencies: []
21
+
22
+ description: A simple tokenizer for NLP tasks.
23
+ email: a.belenkow@uni-trier.de
24
+ executables:
25
+ - tokenize
26
+ extensions: []
27
+
28
+ extra_rdoc_files:
29
+ - README.rdoc
30
+ - LICENSE
31
+ files:
32
+ - lib/tokenizer/version.rb
33
+ - bin/tokenize
34
+ - README.rdoc
35
+ - LICENSE
36
+ - Rakefile
37
+ - test/test_tokenizer.rb
38
+ homepage: http://www.uni-trier.de/index.php?id=34451
39
+ licenses: []
40
+
41
+ post_install_message:
42
+ rdoc_options:
43
+ - -m
44
+ - README.rdoc
45
+ require_paths:
46
+ - lib
47
+ required_ruby_version: !ruby/object:Gem::Requirement
48
+ none: false
49
+ requirements:
50
+ - - ">="
51
+ - !ruby/object:Gem::Version
52
+ hash: 31
53
+ segments:
54
+ - 1
55
+ - 8
56
+ version: "1.8"
57
+ required_rubygems_version: !ruby/object:Gem::Requirement
58
+ none: false
59
+ requirements:
60
+ - - ">"
61
+ - !ruby/object:Gem::Version
62
+ hash: 25
63
+ segments:
64
+ - 1
65
+ - 3
66
+ - 1
67
+ version: 1.3.1
68
+ requirements: []
69
+
70
+ rubyforge_project: tokenizer
71
+ rubygems_version: 1.7.2
72
+ signing_key:
73
+ specification_version: 3
74
+ summary: Tokenizer is a linguistic tool intended to split a text into tokens.
75
+ test_files:
76
+ - test/test_tokenizer.rb