nabatheon 0.0.1

Sign up to get free protection for your applications and to get access to all the features.
checksums.yaml ADDED
@@ -0,0 +1,7 @@
1
+ ---
2
+ SHA1:
3
+ metadata.gz: ffa754c5da46aa74bc07cf04e237fca122dc1841
4
+ data.tar.gz: 88df7edeba1f3e7249991f524d4597e4d03ce8c1
5
+ SHA512:
6
+ metadata.gz: 46a8570a6ee87b72b1aedcb7d428c12756e77129ec7ee5c8b245e36cfc42851caf47f802e6df6d0918c09066fbfdea10c11835eec821cbeb7719444db85a83dd
7
+ data.tar.gz: a618ccb08402fc33333037ded0dd21110733304f2c4ac547d585c0dc0f82b3452d10833621d0960c2e34ade0624e26483bdcd17c8ca250812e0ece4e37d44240
data/.gitignore ADDED
@@ -0,0 +1,16 @@
1
+ /.bundle/
2
+ /.yardoc
3
+ /Gemfile.lock
4
+ /_yardoc/
5
+ /coverage/
6
+ /doc/
7
+ /pkg/
8
+ /spec/reports/
9
+ /tmp/
10
+ *.bundle
11
+ *.so
12
+ *.o
13
+ *.a
14
+ mkmf.log
15
+ *.gem
16
+
data/Gemfile ADDED
@@ -0,0 +1,4 @@
1
+ source 'https://rubygems.org'
2
+
3
+ # Specify your gem's dependencies in nabatheon.gemspec
4
+ gemspec
data/LICENSE.txt ADDED
@@ -0,0 +1,22 @@
1
+ Copyright (c) 2015 Jacob Burenstam
2
+
3
+ MIT License
4
+
5
+ Permission is hereby granted, free of charge, to any person obtaining
6
+ a copy of this software and associated documentation files (the
7
+ "Software"), to deal in the Software without restriction, including
8
+ without limitation the rights to use, copy, modify, merge, publish,
9
+ distribute, sublicense, and/or sell copies of the Software, and to
10
+ permit persons to whom the Software is furnished to do so, subject to
11
+ the following conditions:
12
+
13
+ The above copyright notice and this permission notice shall be
14
+ included in all copies or substantial portions of the Software.
15
+
16
+ THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
17
+ EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
18
+ MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
19
+ NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE
20
+ LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
21
+ OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
22
+ WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
data/README.md ADDED
@@ -0,0 +1,36 @@
1
+ # Nabatheon
2
+
3
+ TODO: Write a gem description
4
+
5
+ ## Installation
6
+
7
+ Add this line to your application's Gemfile:
8
+
9
+ ```ruby
10
+ gem 'nabatheon'
11
+ ```
12
+
13
+ And then execute:
14
+
15
+ $ bundle
16
+
17
+ Or install it yourself as:
18
+
19
+ $ gem install nabatheon
20
+
21
+ ## Usage
22
+
23
+ ```ruby
24
+ text = <<-content
25
+ Angela Merkel met Nicolas Sarkozy on January 25th in Berlin to discuss a new austerity package. Sarkozy looked pleased, but Merkel was dismayed.
26
+ content
27
+ Nabatheon.annotate(text)
28
+ ```
29
+
30
+ ## Contributing
31
+
32
+ 1. Fork it ( https://github.com/buren/nabatheon/fork )
33
+ 2. Create your feature branch (`git checkout -b my-new-feature`)
34
+ 3. Commit your changes (`git commit -am 'Add some feature'`)
35
+ 4. Push to the branch (`git push origin my-new-feature`)
36
+ 5. Create a new Pull Request
data/Rakefile ADDED
@@ -0,0 +1,11 @@
1
+ require 'bundler/gem_tasks'
2
+
3
+ task default: [:console]
4
+
5
+ task :console do
6
+ require 'irb'
7
+ require 'irb/completion'
8
+ require 'nabatheon'
9
+ ARGV.clear
10
+ IRB.start
11
+ end
data/bin/nabatheon ADDED
@@ -0,0 +1,11 @@
1
+ #!/usr/bin/env ruby
2
+
3
+ require 'nabatheon'
4
+
5
+ text = if File.exists?(ARGV[0])
6
+ File.read(ARGV[0])
7
+ else
8
+ ARGV.join(' ')
9
+ end
10
+
11
+ Nabatheon.annotate(text)
@@ -0,0 +1,3 @@
1
+ module Nabatheon
2
+ VERSION = '0.0.1'
3
+ end
data/lib/nabatheon.rb ADDED
@@ -0,0 +1,26 @@
1
+ require 'nabatheon/version'
2
+ require 'stanford-core-nlp'
3
+
4
+ module Nabatheon
5
+ BASE_DEP_PATH = "#{File.expand_path('~')}/.stanford-nlp"
6
+ StanfordCoreNLP.jar_path = "#{BASE_DEP_PATH}/nlp/jars/stanford-core-nlp-full/"
7
+ StanfordCoreNLP.model_path = "#{BASE_DEP_PATH}/nlp/models/"
8
+ StanfordCoreNLP.log_file = 'tmp/log.txt'
9
+ StanfordCoreNLP.use :english
10
+ Pipeline = StanfordCoreNLP.load(:tokenize, :ssplit, :pos, :lemma, :parse, :ner)
11
+
12
+ def self.annotate(raw_text)
13
+ text = StanfordCoreNLP::Annotation.new(raw_text)
14
+ Pipeline.annotate(text)
15
+
16
+ named_lemma = []
17
+ text.get(:sentences).each do |sentence|
18
+ sentence.get(:tokens).each do |token|
19
+ entity_tag = token.get(:named_entity_tag).to_s
20
+ lemma = token.get(:lemma).to_s
21
+ named_lemma << [entity_tag, lemma] unless entity_tag == 'O'
22
+ end
23
+ end
24
+ puts named_lemma.inspect
25
+ end
26
+ end
data/nabatheon.gemspec ADDED
@@ -0,0 +1,26 @@
1
+ # coding: utf-8
2
+ lib = File.expand_path('../lib', __FILE__)
3
+ $LOAD_PATH.unshift(lib) unless $LOAD_PATH.include?(lib)
4
+ require 'nabatheon/version'
5
+
6
+ Gem::Specification.new do |spec|
7
+ spec.name = 'nabatheon'
8
+ spec.version = Nabatheon::VERSION
9
+ spec.authors = ['Jacob Burenstam']
10
+ spec.email = ['burenstam@gmail.com']
11
+ spec.summary = %q{Extract named entities and lemmas using StanfordCoreNLP.}
12
+ spec.description = %q{Extract named entities and lemmas using StanfordCoreNLP (alpha). Assumes that all dependencies are in ~/.stanford-nlp}
13
+ spec.homepage = 'https://github.com/buren/nabatheon'
14
+ spec.license = 'MIT'
15
+
16
+ spec.files = `git ls-files -z`.split("\x0")
17
+ spec.executables = spec.files.grep(%r{^bin/}) { |f| File.basename(f) }
18
+ spec.test_files = spec.files.grep(%r{^(test|spec|features)/})
19
+ spec.require_paths = ['lib']
20
+
21
+ spec.add_dependency 'stanford-core-nlp', '0.5.1'
22
+
23
+ spec.add_development_dependency 'bundler', '~> 1.7'
24
+ spec.add_development_dependency 'rake', '~> 10.0'
25
+ spec.add_development_dependency 'pry'
26
+ end
metadata ADDED
@@ -0,0 +1,112 @@
1
+ --- !ruby/object:Gem::Specification
2
+ name: nabatheon
3
+ version: !ruby/object:Gem::Version
4
+ version: 0.0.1
5
+ platform: ruby
6
+ authors:
7
+ - Jacob Burenstam
8
+ autorequire:
9
+ bindir: bin
10
+ cert_chain: []
11
+ date: 2015-05-08 00:00:00.000000000 Z
12
+ dependencies:
13
+ - !ruby/object:Gem::Dependency
14
+ name: stanford-core-nlp
15
+ requirement: !ruby/object:Gem::Requirement
16
+ requirements:
17
+ - - '='
18
+ - !ruby/object:Gem::Version
19
+ version: 0.5.1
20
+ type: :runtime
21
+ prerelease: false
22
+ version_requirements: !ruby/object:Gem::Requirement
23
+ requirements:
24
+ - - '='
25
+ - !ruby/object:Gem::Version
26
+ version: 0.5.1
27
+ - !ruby/object:Gem::Dependency
28
+ name: bundler
29
+ requirement: !ruby/object:Gem::Requirement
30
+ requirements:
31
+ - - "~>"
32
+ - !ruby/object:Gem::Version
33
+ version: '1.7'
34
+ type: :development
35
+ prerelease: false
36
+ version_requirements: !ruby/object:Gem::Requirement
37
+ requirements:
38
+ - - "~>"
39
+ - !ruby/object:Gem::Version
40
+ version: '1.7'
41
+ - !ruby/object:Gem::Dependency
42
+ name: rake
43
+ requirement: !ruby/object:Gem::Requirement
44
+ requirements:
45
+ - - "~>"
46
+ - !ruby/object:Gem::Version
47
+ version: '10.0'
48
+ type: :development
49
+ prerelease: false
50
+ version_requirements: !ruby/object:Gem::Requirement
51
+ requirements:
52
+ - - "~>"
53
+ - !ruby/object:Gem::Version
54
+ version: '10.0'
55
+ - !ruby/object:Gem::Dependency
56
+ name: pry
57
+ requirement: !ruby/object:Gem::Requirement
58
+ requirements:
59
+ - - ">="
60
+ - !ruby/object:Gem::Version
61
+ version: '0'
62
+ type: :development
63
+ prerelease: false
64
+ version_requirements: !ruby/object:Gem::Requirement
65
+ requirements:
66
+ - - ">="
67
+ - !ruby/object:Gem::Version
68
+ version: '0'
69
+ description: Extract named entities and lemmas using StanfordCoreNLP (alpha). Assumes
70
+ that all dependencies are in ~/.stanford-nlp
71
+ email:
72
+ - burenstam@gmail.com
73
+ executables:
74
+ - nabatheon
75
+ extensions: []
76
+ extra_rdoc_files: []
77
+ files:
78
+ - ".gitignore"
79
+ - Gemfile
80
+ - LICENSE.txt
81
+ - README.md
82
+ - Rakefile
83
+ - bin/nabatheon
84
+ - lib/nabatheon.rb
85
+ - lib/nabatheon/version.rb
86
+ - nabatheon.gemspec
87
+ homepage: https://github.com/buren/nabatheon
88
+ licenses:
89
+ - MIT
90
+ metadata: {}
91
+ post_install_message:
92
+ rdoc_options: []
93
+ require_paths:
94
+ - lib
95
+ required_ruby_version: !ruby/object:Gem::Requirement
96
+ requirements:
97
+ - - ">="
98
+ - !ruby/object:Gem::Version
99
+ version: '0'
100
+ required_rubygems_version: !ruby/object:Gem::Requirement
101
+ requirements:
102
+ - - ">="
103
+ - !ruby/object:Gem::Version
104
+ version: '0'
105
+ requirements: []
106
+ rubyforge_project:
107
+ rubygems_version: 2.2.2
108
+ signing_key:
109
+ specification_version: 4
110
+ summary: Extract named entities and lemmas using StanfordCoreNLP.
111
+ test_files: []
112
+ has_rdoc: