ark_tweet_nlp 0.3.1 → 0.3.2

Sign up to get free protection for your applications and to get access to all the features.
checksums.yaml CHANGED
@@ -1,7 +1,7 @@
1
1
  ---
2
2
  SHA1:
3
- metadata.gz: 3e871d9a343c2765aa5ffe330399d65186a8f53d
4
- data.tar.gz: e38987b047782875d9da857935b0570fda9ed8fd
3
+ metadata.gz: edcfbf9006fa1fd8b4d0f8fd882f33cdda06d903
4
+ data.tar.gz: f87ed6b80eac040f92a109641dafb651761eb592
5
5
  SHA512:
6
- metadata.gz: 96f63bbdd0534f4b63a5a93c96c5d14702ea572c2286febc45dccda9ee6844c0070e878286557bb66dc2a6c89bc34cc146cf75095d48a99324f82d1efff09c54
7
- data.tar.gz: 5f709d7f6ef82b0942cad0380afc827d4c080ea9acc9f5ec6294797691a893f1582e820a2c66636ea10d5fc5edb2b4149dcc19c488e838e57e1d34e8b6aa82b7
6
+ metadata.gz: ab69ac07296077fe85ccbf2e11d411d97cc690ba1dca8e215255f0d5ae02edff780dbf7406d3482b10a7d4697731f273060241645ab0aa12f7bda26ff091c17f
7
+ data.tar.gz: b02476e693cb8ebf6968a9d252dc090e0df0b8529d99ce441058c1e0871a69f99c92bee6769b88455885bcef73b354a698f791784b54f42c88a54e32f77f8c2e
@@ -40,7 +40,7 @@ module ArkTweetNlp
40
40
  end
41
41
 
42
42
  def Parser.find_tags text
43
- result = Parser.run_tagger(text)
43
+ result = Parser.run_tagger(text.tr_s("\t"," ")).gsub(/\t\t\t\s*\n/,'')
44
44
  result.split("\n").map{ |line| Parser.convert_line( line ) }
45
45
  end
46
46
 
@@ -73,9 +73,9 @@ module ArkTweetNlp
73
73
  end
74
74
 
75
75
  def Parser.convert_line line
76
- text = line.split("\t")[0].split
77
- tags = line.split("\t")[1].split
78
- text.each.with_index.inject({}){ |result,(value,index)| result[value] = tags[index].to_sym; result }
76
+ text = line.split("\t")[0].split
77
+ tags = line.split("\t")[1].split
78
+ text.each.with_index.inject({}){ |result,(value,index)| result[value] = tags[index].to_sym; result }
79
79
  end
80
80
 
81
81
  def Parser.safe_invert hash
@@ -1,3 +1,3 @@
1
1
  module ArkTweetNlp
2
- VERSION = "0.3.1"
2
+ VERSION = "0.3.2"
3
3
  end
@@ -6,6 +6,7 @@ describe ArkTweetNlp::Parser do
6
6
  expect(ArkTweetNlp::Parser::TAGSET.size).to eq 25
7
7
  end
8
8
  end
9
+
9
10
  describe '#find_tags' do
10
11
  it "cathegorizes words in tweets" do
11
12
  expect(ArkTweetNlp::Parser.find_tags('faceboooooooook is awesome')).to eq([ {'faceboooooooook' => :^,
@@ -15,13 +16,16 @@ describe ArkTweetNlp::Parser do
15
16
  it "suports urls" do
16
17
  expect(ArkTweetNlp::Parser.find_tags("I think I haven't had a segmentation fault in years http://t.co/COjaaFj6Ib")).to eq( [{"I"=>:O, "think"=>:V, "haven't"=>:V, "had"=>:V, "a"=>:D, "segmentation"=>:N, "fault"=>:N, "in"=>:P, "years"=>:N, "http://t.co/COjaaFj6Ib"=>:U}] )
17
18
  end
18
- it "supoorts ponctuation from the tweets" do
19
- expect(ArkTweetNlp::Parser.find_tags("Delayed... And waiting on a tire from Louisville. \"You can't be serious #Disappointed #pissed #letdown http://t.co/BFqsPZmr8m")).to eq([{"Delayed"=>:V, "..."=>:",", "And"=>:&, "waiting"=>:V, "on"=>:P, "a"=>:D, "tire"=>:N, "from"=>:P, "Louisville"=>:^, "."=>:",", "\""=>:",", "You"=>:O, "can't"=>:V, "be"=>:V, "serious"=>:A, "#Disappointed"=>:"#", "#pissed"=>:"#", "#letdown"=>:"#", "http://t.co/BFqsPZmr8m"=>:U}])
19
+ it "supoorts ponctuation from the tweets, but removes \t" do
20
+ expect(ArkTweetNlp::Parser.find_tags("Delayed... And waiting on \t a tire from Louisville. \"You can't be serious #Disappointed #pissed #letdown http://t.co/BFqsPZmr8m")).to eq([{"Delayed"=>:V, "..."=>:",", "And"=>:&, "waiting"=>:V, "on"=>:P, "a"=>:D, "tire"=>:N, "from"=>:P, "Louisville"=>:^, "."=>:",", "\""=>:",", "You"=>:O, "can't"=>:V, "be"=>:V, "serious"=>:A, "#Disappointed"=>:"#", "#pissed"=>:"#", "#letdown"=>:"#", "http://t.co/BFqsPZmr8m"=>:U}])
20
21
  end
21
22
  it "tags multiple tweets per line" do
22
23
  expect(ArkTweetNlp::Parser.find_tags("faceboooooooook is awesome\nfaceboooooooook is awesome")).to eq([{'faceboooooooook' => :^,'is' => :V,'awesome' => :A},{'faceboooooooook' => :^,'is' => :V,'awesome' => :A} ])
23
24
 
24
25
  end
26
+ it 'supports empty strings' do
27
+ expect(ArkTweetNlp::Parser.find_tags("\t\t\t\nfaceboooooooook is awesome\nfaceboooooooook is awesome")).to eq([{'faceboooooooook' => :^,'is' => :V,'awesome' => :A},{'faceboooooooook' => :^,'is' => :V,'awesome' => :A} ])
28
+ end
25
29
  end
26
30
 
27
31
  describe '#get_words_tagged_as' do
metadata CHANGED
@@ -1,167 +1,167 @@
1
1
  --- !ruby/object:Gem::Specification
2
2
  name: ark_tweet_nlp
3
3
  version: !ruby/object:Gem::Version
4
- version: 0.3.1
4
+ version: 0.3.2
5
5
  platform: ruby
6
6
  authors:
7
7
  - Bernardo
8
8
  autorequire:
9
9
  bindir: bin
10
10
  cert_chain: []
11
- date: 2014-09-15 00:00:00.000000000 Z
11
+ date: 2014-09-22 00:00:00.000000000 Z
12
12
  dependencies:
13
13
  - !ruby/object:Gem::Dependency
14
14
  name: bundler
15
15
  requirement: !ruby/object:Gem::Requirement
16
16
  requirements:
17
- - - ~>
17
+ - - "~>"
18
18
  - !ruby/object:Gem::Version
19
19
  version: '1.7'
20
20
  type: :development
21
21
  prerelease: false
22
22
  version_requirements: !ruby/object:Gem::Requirement
23
23
  requirements:
24
- - - ~>
24
+ - - "~>"
25
25
  - !ruby/object:Gem::Version
26
26
  version: '1.7'
27
27
  - !ruby/object:Gem::Dependency
28
28
  name: rake
29
29
  requirement: !ruby/object:Gem::Requirement
30
30
  requirements:
31
- - - ~>
31
+ - - "~>"
32
32
  - !ruby/object:Gem::Version
33
33
  version: '10.0'
34
34
  type: :development
35
35
  prerelease: false
36
36
  version_requirements: !ruby/object:Gem::Requirement
37
37
  requirements:
38
- - - ~>
38
+ - - "~>"
39
39
  - !ruby/object:Gem::Version
40
40
  version: '10.0'
41
41
  - !ruby/object:Gem::Dependency
42
42
  name: rspec
43
43
  requirement: !ruby/object:Gem::Requirement
44
44
  requirements:
45
- - - '>='
45
+ - - ">="
46
46
  - !ruby/object:Gem::Version
47
47
  version: '0'
48
48
  type: :development
49
49
  prerelease: false
50
50
  version_requirements: !ruby/object:Gem::Requirement
51
51
  requirements:
52
- - - '>='
52
+ - - ">="
53
53
  - !ruby/object:Gem::Version
54
54
  version: '0'
55
55
  - !ruby/object:Gem::Dependency
56
56
  name: rspec-nc
57
57
  requirement: !ruby/object:Gem::Requirement
58
58
  requirements:
59
- - - '>='
59
+ - - ">="
60
60
  - !ruby/object:Gem::Version
61
61
  version: '0'
62
62
  type: :development
63
63
  prerelease: false
64
64
  version_requirements: !ruby/object:Gem::Requirement
65
65
  requirements:
66
- - - '>='
66
+ - - ">="
67
67
  - !ruby/object:Gem::Version
68
68
  version: '0'
69
69
  - !ruby/object:Gem::Dependency
70
70
  name: pry
71
71
  requirement: !ruby/object:Gem::Requirement
72
72
  requirements:
73
- - - '>='
73
+ - - ">="
74
74
  - !ruby/object:Gem::Version
75
75
  version: '0'
76
76
  type: :development
77
77
  prerelease: false
78
78
  version_requirements: !ruby/object:Gem::Requirement
79
79
  requirements:
80
- - - '>='
80
+ - - ">="
81
81
  - !ruby/object:Gem::Version
82
82
  version: '0'
83
83
  - !ruby/object:Gem::Dependency
84
84
  name: pry-nav
85
85
  requirement: !ruby/object:Gem::Requirement
86
86
  requirements:
87
- - - '>='
87
+ - - ">="
88
88
  - !ruby/object:Gem::Version
89
89
  version: '0'
90
90
  type: :development
91
91
  prerelease: false
92
92
  version_requirements: !ruby/object:Gem::Requirement
93
93
  requirements:
94
- - - '>='
94
+ - - ">="
95
95
  - !ruby/object:Gem::Version
96
96
  version: '0'
97
97
  - !ruby/object:Gem::Dependency
98
98
  name: pry-rescue
99
99
  requirement: !ruby/object:Gem::Requirement
100
100
  requirements:
101
- - - '>='
101
+ - - ">="
102
102
  - !ruby/object:Gem::Version
103
103
  version: '0'
104
104
  type: :development
105
105
  prerelease: false
106
106
  version_requirements: !ruby/object:Gem::Requirement
107
107
  requirements:
108
- - - '>='
108
+ - - ">="
109
109
  - !ruby/object:Gem::Version
110
110
  version: '0'
111
111
  - !ruby/object:Gem::Dependency
112
112
  name: pry-stack_explorer
113
113
  requirement: !ruby/object:Gem::Requirement
114
114
  requirements:
115
- - - '>='
115
+ - - ">="
116
116
  - !ruby/object:Gem::Version
117
117
  version: '0'
118
118
  type: :development
119
119
  prerelease: false
120
120
  version_requirements: !ruby/object:Gem::Requirement
121
121
  requirements:
122
- - - '>='
122
+ - - ">="
123
123
  - !ruby/object:Gem::Version
124
124
  version: '0'
125
125
  - !ruby/object:Gem::Dependency
126
126
  name: pry-doc
127
127
  requirement: !ruby/object:Gem::Requirement
128
128
  requirements:
129
- - - '>='
129
+ - - ">="
130
130
  - !ruby/object:Gem::Version
131
131
  version: '0'
132
132
  type: :development
133
133
  prerelease: false
134
134
  version_requirements: !ruby/object:Gem::Requirement
135
135
  requirements:
136
- - - '>='
136
+ - - ">="
137
137
  - !ruby/object:Gem::Version
138
138
  version: '0'
139
139
  - !ruby/object:Gem::Dependency
140
140
  name: guard
141
141
  requirement: !ruby/object:Gem::Requirement
142
142
  requirements:
143
- - - '>='
143
+ - - ">="
144
144
  - !ruby/object:Gem::Version
145
145
  version: '0'
146
146
  type: :development
147
147
  prerelease: false
148
148
  version_requirements: !ruby/object:Gem::Requirement
149
149
  requirements:
150
- - - '>='
150
+ - - ">="
151
151
  - !ruby/object:Gem::Version
152
152
  version: '0'
153
153
  - !ruby/object:Gem::Dependency
154
154
  name: guard-rspec
155
155
  requirement: !ruby/object:Gem::Requirement
156
156
  requirements:
157
- - - '>='
157
+ - - ">="
158
158
  - !ruby/object:Gem::Version
159
159
  version: '0'
160
160
  type: :development
161
161
  prerelease: false
162
162
  version_requirements: !ruby/object:Gem::Requirement
163
163
  requirements:
164
- - - '>='
164
+ - - ">="
165
165
  - !ruby/object:Gem::Version
166
166
  version: '0'
167
167
  description: Tags tweets word into multiple cathegories using NLP
@@ -173,7 +173,7 @@ executables:
173
173
  extensions: []
174
174
  extra_rdoc_files: []
175
175
  files:
176
- - .gitignore
176
+ - ".gitignore"
177
177
  - Gemfile
178
178
  - Guardfile
179
179
  - LICENSE.txt
@@ -197,20 +197,21 @@ require_paths:
197
197
  - lib
198
198
  required_ruby_version: !ruby/object:Gem::Requirement
199
199
  requirements:
200
- - - '>='
200
+ - - ">="
201
201
  - !ruby/object:Gem::Version
202
202
  version: '0'
203
203
  required_rubygems_version: !ruby/object:Gem::Requirement
204
204
  requirements:
205
- - - '>='
205
+ - - ">="
206
206
  - !ruby/object:Gem::Version
207
207
  version: '0'
208
208
  requirements: []
209
209
  rubyforge_project:
210
- rubygems_version: 2.0.14
210
+ rubygems_version: 2.2.2
211
211
  signing_key:
212
212
  specification_version: 4
213
213
  summary: Ruby wrapper for the Carnegie Mellon Twitter NLP
214
214
  test_files:
215
215
  - spec/parser_spec.rb
216
216
  - spec/spec_helper.rb
217
+ has_rdoc: