ark_tweet_nlp 0.3.1 → 0.3.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
checksums.yaml CHANGED
@@ -1,7 +1,7 @@
1
1
  ---
2
2
  SHA1:
3
- metadata.gz: 3e871d9a343c2765aa5ffe330399d65186a8f53d
4
- data.tar.gz: e38987b047782875d9da857935b0570fda9ed8fd
3
+ metadata.gz: edcfbf9006fa1fd8b4d0f8fd882f33cdda06d903
4
+ data.tar.gz: f87ed6b80eac040f92a109641dafb651761eb592
5
5
  SHA512:
6
- metadata.gz: 96f63bbdd0534f4b63a5a93c96c5d14702ea572c2286febc45dccda9ee6844c0070e878286557bb66dc2a6c89bc34cc146cf75095d48a99324f82d1efff09c54
7
- data.tar.gz: 5f709d7f6ef82b0942cad0380afc827d4c080ea9acc9f5ec6294797691a893f1582e820a2c66636ea10d5fc5edb2b4149dcc19c488e838e57e1d34e8b6aa82b7
6
+ metadata.gz: ab69ac07296077fe85ccbf2e11d411d97cc690ba1dca8e215255f0d5ae02edff780dbf7406d3482b10a7d4697731f273060241645ab0aa12f7bda26ff091c17f
7
+ data.tar.gz: b02476e693cb8ebf6968a9d252dc090e0df0b8529d99ce441058c1e0871a69f99c92bee6769b88455885bcef73b354a698f791784b54f42c88a54e32f77f8c2e
@@ -40,7 +40,7 @@ module ArkTweetNlp
40
40
  end
41
41
 
42
42
  def Parser.find_tags text
43
- result = Parser.run_tagger(text)
43
+ result = Parser.run_tagger(text.tr_s("\t"," ")).gsub(/\t\t\t\s*\n/,'')
44
44
  result.split("\n").map{ |line| Parser.convert_line( line ) }
45
45
  end
46
46
 
@@ -73,9 +73,9 @@ module ArkTweetNlp
73
73
  end
74
74
 
75
75
  def Parser.convert_line line
76
- text = line.split("\t")[0].split
77
- tags = line.split("\t")[1].split
78
- text.each.with_index.inject({}){ |result,(value,index)| result[value] = tags[index].to_sym; result }
76
+ text = line.split("\t")[0].split
77
+ tags = line.split("\t")[1].split
78
+ text.each.with_index.inject({}){ |result,(value,index)| result[value] = tags[index].to_sym; result }
79
79
  end
80
80
 
81
81
  def Parser.safe_invert hash
@@ -1,3 +1,3 @@
1
1
  module ArkTweetNlp
2
- VERSION = "0.3.1"
2
+ VERSION = "0.3.2"
3
3
  end
@@ -6,6 +6,7 @@ describe ArkTweetNlp::Parser do
6
6
  expect(ArkTweetNlp::Parser::TAGSET.size).to eq 25
7
7
  end
8
8
  end
9
+
9
10
  describe '#find_tags' do
10
11
  it "cathegorizes words in tweets" do
11
12
  expect(ArkTweetNlp::Parser.find_tags('faceboooooooook is awesome')).to eq([ {'faceboooooooook' => :^,
@@ -15,13 +16,16 @@ describe ArkTweetNlp::Parser do
15
16
  it "suports urls" do
16
17
  expect(ArkTweetNlp::Parser.find_tags("I think I haven't had a segmentation fault in years http://t.co/COjaaFj6Ib")).to eq( [{"I"=>:O, "think"=>:V, "haven't"=>:V, "had"=>:V, "a"=>:D, "segmentation"=>:N, "fault"=>:N, "in"=>:P, "years"=>:N, "http://t.co/COjaaFj6Ib"=>:U}] )
17
18
  end
18
- it "supoorts ponctuation from the tweets" do
19
- expect(ArkTweetNlp::Parser.find_tags("Delayed... And waiting on a tire from Louisville. \"You can't be serious #Disappointed #pissed #letdown http://t.co/BFqsPZmr8m")).to eq([{"Delayed"=>:V, "..."=>:",", "And"=>:&, "waiting"=>:V, "on"=>:P, "a"=>:D, "tire"=>:N, "from"=>:P, "Louisville"=>:^, "."=>:",", "\""=>:",", "You"=>:O, "can't"=>:V, "be"=>:V, "serious"=>:A, "#Disappointed"=>:"#", "#pissed"=>:"#", "#letdown"=>:"#", "http://t.co/BFqsPZmr8m"=>:U}])
19
+ it "supoorts ponctuation from the tweets, but removes \t" do
20
+ expect(ArkTweetNlp::Parser.find_tags("Delayed... And waiting on \t a tire from Louisville. \"You can't be serious #Disappointed #pissed #letdown http://t.co/BFqsPZmr8m")).to eq([{"Delayed"=>:V, "..."=>:",", "And"=>:&, "waiting"=>:V, "on"=>:P, "a"=>:D, "tire"=>:N, "from"=>:P, "Louisville"=>:^, "."=>:",", "\""=>:",", "You"=>:O, "can't"=>:V, "be"=>:V, "serious"=>:A, "#Disappointed"=>:"#", "#pissed"=>:"#", "#letdown"=>:"#", "http://t.co/BFqsPZmr8m"=>:U}])
20
21
  end
21
22
  it "tags multiple tweets per line" do
22
23
  expect(ArkTweetNlp::Parser.find_tags("faceboooooooook is awesome\nfaceboooooooook is awesome")).to eq([{'faceboooooooook' => :^,'is' => :V,'awesome' => :A},{'faceboooooooook' => :^,'is' => :V,'awesome' => :A} ])
23
24
 
24
25
  end
26
+ it 'supports empty strings' do
27
+ expect(ArkTweetNlp::Parser.find_tags("\t\t\t\nfaceboooooooook is awesome\nfaceboooooooook is awesome")).to eq([{'faceboooooooook' => :^,'is' => :V,'awesome' => :A},{'faceboooooooook' => :^,'is' => :V,'awesome' => :A} ])
28
+ end
25
29
  end
26
30
 
27
31
  describe '#get_words_tagged_as' do
metadata CHANGED
@@ -1,167 +1,167 @@
1
1
  --- !ruby/object:Gem::Specification
2
2
  name: ark_tweet_nlp
3
3
  version: !ruby/object:Gem::Version
4
- version: 0.3.1
4
+ version: 0.3.2
5
5
  platform: ruby
6
6
  authors:
7
7
  - Bernardo
8
8
  autorequire:
9
9
  bindir: bin
10
10
  cert_chain: []
11
- date: 2014-09-15 00:00:00.000000000 Z
11
+ date: 2014-09-22 00:00:00.000000000 Z
12
12
  dependencies:
13
13
  - !ruby/object:Gem::Dependency
14
14
  name: bundler
15
15
  requirement: !ruby/object:Gem::Requirement
16
16
  requirements:
17
- - - ~>
17
+ - - "~>"
18
18
  - !ruby/object:Gem::Version
19
19
  version: '1.7'
20
20
  type: :development
21
21
  prerelease: false
22
22
  version_requirements: !ruby/object:Gem::Requirement
23
23
  requirements:
24
- - - ~>
24
+ - - "~>"
25
25
  - !ruby/object:Gem::Version
26
26
  version: '1.7'
27
27
  - !ruby/object:Gem::Dependency
28
28
  name: rake
29
29
  requirement: !ruby/object:Gem::Requirement
30
30
  requirements:
31
- - - ~>
31
+ - - "~>"
32
32
  - !ruby/object:Gem::Version
33
33
  version: '10.0'
34
34
  type: :development
35
35
  prerelease: false
36
36
  version_requirements: !ruby/object:Gem::Requirement
37
37
  requirements:
38
- - - ~>
38
+ - - "~>"
39
39
  - !ruby/object:Gem::Version
40
40
  version: '10.0'
41
41
  - !ruby/object:Gem::Dependency
42
42
  name: rspec
43
43
  requirement: !ruby/object:Gem::Requirement
44
44
  requirements:
45
- - - '>='
45
+ - - ">="
46
46
  - !ruby/object:Gem::Version
47
47
  version: '0'
48
48
  type: :development
49
49
  prerelease: false
50
50
  version_requirements: !ruby/object:Gem::Requirement
51
51
  requirements:
52
- - - '>='
52
+ - - ">="
53
53
  - !ruby/object:Gem::Version
54
54
  version: '0'
55
55
  - !ruby/object:Gem::Dependency
56
56
  name: rspec-nc
57
57
  requirement: !ruby/object:Gem::Requirement
58
58
  requirements:
59
- - - '>='
59
+ - - ">="
60
60
  - !ruby/object:Gem::Version
61
61
  version: '0'
62
62
  type: :development
63
63
  prerelease: false
64
64
  version_requirements: !ruby/object:Gem::Requirement
65
65
  requirements:
66
- - - '>='
66
+ - - ">="
67
67
  - !ruby/object:Gem::Version
68
68
  version: '0'
69
69
  - !ruby/object:Gem::Dependency
70
70
  name: pry
71
71
  requirement: !ruby/object:Gem::Requirement
72
72
  requirements:
73
- - - '>='
73
+ - - ">="
74
74
  - !ruby/object:Gem::Version
75
75
  version: '0'
76
76
  type: :development
77
77
  prerelease: false
78
78
  version_requirements: !ruby/object:Gem::Requirement
79
79
  requirements:
80
- - - '>='
80
+ - - ">="
81
81
  - !ruby/object:Gem::Version
82
82
  version: '0'
83
83
  - !ruby/object:Gem::Dependency
84
84
  name: pry-nav
85
85
  requirement: !ruby/object:Gem::Requirement
86
86
  requirements:
87
- - - '>='
87
+ - - ">="
88
88
  - !ruby/object:Gem::Version
89
89
  version: '0'
90
90
  type: :development
91
91
  prerelease: false
92
92
  version_requirements: !ruby/object:Gem::Requirement
93
93
  requirements:
94
- - - '>='
94
+ - - ">="
95
95
  - !ruby/object:Gem::Version
96
96
  version: '0'
97
97
  - !ruby/object:Gem::Dependency
98
98
  name: pry-rescue
99
99
  requirement: !ruby/object:Gem::Requirement
100
100
  requirements:
101
- - - '>='
101
+ - - ">="
102
102
  - !ruby/object:Gem::Version
103
103
  version: '0'
104
104
  type: :development
105
105
  prerelease: false
106
106
  version_requirements: !ruby/object:Gem::Requirement
107
107
  requirements:
108
- - - '>='
108
+ - - ">="
109
109
  - !ruby/object:Gem::Version
110
110
  version: '0'
111
111
  - !ruby/object:Gem::Dependency
112
112
  name: pry-stack_explorer
113
113
  requirement: !ruby/object:Gem::Requirement
114
114
  requirements:
115
- - - '>='
115
+ - - ">="
116
116
  - !ruby/object:Gem::Version
117
117
  version: '0'
118
118
  type: :development
119
119
  prerelease: false
120
120
  version_requirements: !ruby/object:Gem::Requirement
121
121
  requirements:
122
- - - '>='
122
+ - - ">="
123
123
  - !ruby/object:Gem::Version
124
124
  version: '0'
125
125
  - !ruby/object:Gem::Dependency
126
126
  name: pry-doc
127
127
  requirement: !ruby/object:Gem::Requirement
128
128
  requirements:
129
- - - '>='
129
+ - - ">="
130
130
  - !ruby/object:Gem::Version
131
131
  version: '0'
132
132
  type: :development
133
133
  prerelease: false
134
134
  version_requirements: !ruby/object:Gem::Requirement
135
135
  requirements:
136
- - - '>='
136
+ - - ">="
137
137
  - !ruby/object:Gem::Version
138
138
  version: '0'
139
139
  - !ruby/object:Gem::Dependency
140
140
  name: guard
141
141
  requirement: !ruby/object:Gem::Requirement
142
142
  requirements:
143
- - - '>='
143
+ - - ">="
144
144
  - !ruby/object:Gem::Version
145
145
  version: '0'
146
146
  type: :development
147
147
  prerelease: false
148
148
  version_requirements: !ruby/object:Gem::Requirement
149
149
  requirements:
150
- - - '>='
150
+ - - ">="
151
151
  - !ruby/object:Gem::Version
152
152
  version: '0'
153
153
  - !ruby/object:Gem::Dependency
154
154
  name: guard-rspec
155
155
  requirement: !ruby/object:Gem::Requirement
156
156
  requirements:
157
- - - '>='
157
+ - - ">="
158
158
  - !ruby/object:Gem::Version
159
159
  version: '0'
160
160
  type: :development
161
161
  prerelease: false
162
162
  version_requirements: !ruby/object:Gem::Requirement
163
163
  requirements:
164
- - - '>='
164
+ - - ">="
165
165
  - !ruby/object:Gem::Version
166
166
  version: '0'
167
167
  description: Tags tweets word into multiple cathegories using NLP
@@ -173,7 +173,7 @@ executables:
173
173
  extensions: []
174
174
  extra_rdoc_files: []
175
175
  files:
176
- - .gitignore
176
+ - ".gitignore"
177
177
  - Gemfile
178
178
  - Guardfile
179
179
  - LICENSE.txt
@@ -197,20 +197,21 @@ require_paths:
197
197
  - lib
198
198
  required_ruby_version: !ruby/object:Gem::Requirement
199
199
  requirements:
200
- - - '>='
200
+ - - ">="
201
201
  - !ruby/object:Gem::Version
202
202
  version: '0'
203
203
  required_rubygems_version: !ruby/object:Gem::Requirement
204
204
  requirements:
205
- - - '>='
205
+ - - ">="
206
206
  - !ruby/object:Gem::Version
207
207
  version: '0'
208
208
  requirements: []
209
209
  rubyforge_project:
210
- rubygems_version: 2.0.14
210
+ rubygems_version: 2.2.2
211
211
  signing_key:
212
212
  specification_version: 4
213
213
  summary: Ruby wrapper for the Carnegie Mellon Twitter NLP
214
214
  test_files:
215
215
  - spec/parser_spec.rb
216
216
  - spec/spec_helper.rb
217
+ has_rdoc: