find_keywords 0.0.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
checksums.yaml ADDED
@@ -0,0 +1,7 @@
1
+ ---
2
+ SHA1:
3
+ metadata.gz: 0a4277baab77ff4776252c7c37ce8f9588d45710
4
+ data.tar.gz: ac9adf2ce1ddb9b77d732958af824caf1d266e0c
5
+ SHA512:
6
+ metadata.gz: 7a0b27073500e298c0cd9513aeb0722684295b8182b99a3f73f609a9ae46b5b9413c5931ac8a4dce1d8ba3d4097496177d529df24111999620b81617e0293d64
7
+ data.tar.gz: 75497b8673d5ab97afc6adcf1823a316c337e5f7818a18c274572e383dc4b45ae3d61ea8294387111f34fd37acfd45b92057061e4fd56a7e7e3586c1ae77553f
data/.gitignore ADDED
@@ -0,0 +1,22 @@
1
+ *.gem
2
+ *.rbc
3
+ .bundle
4
+ .config
5
+ .yardoc
6
+ Gemfile.lock
7
+ InstalledFiles
8
+ _yardoc
9
+ coverage
10
+ doc/
11
+ lib/bundler/man
12
+ pkg
13
+ rdoc
14
+ spec/reports
15
+ test/tmp
16
+ test/version_tmp
17
+ tmp
18
+ *.bundle
19
+ *.so
20
+ *.o
21
+ *.a
22
+ mkmf.log
data/Gemfile ADDED
@@ -0,0 +1,4 @@
1
+ source 'https://rubygems.org'
2
+
3
+ # Specify your gem's dependencies in find_keywords.gemspec
4
+ gemspec
data/LICENSE.txt ADDED
@@ -0,0 +1,22 @@
1
+ Copyright (c) 2014 Kirk Jarvis
2
+
3
+ MIT License
4
+
5
+ Permission is hereby granted, free of charge, to any person obtaining
6
+ a copy of this software and associated documentation files (the
7
+ "Software"), to deal in the Software without restriction, including
8
+ without limitation the rights to use, copy, modify, merge, publish,
9
+ distribute, sublicense, and/or sell copies of the Software, and to
10
+ permit persons to whom the Software is furnished to do so, subject to
11
+ the following conditions:
12
+
13
+ The above copyright notice and this permission notice shall be
14
+ included in all copies or substantial portions of the Software.
15
+
16
+ THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
17
+ EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
18
+ MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
19
+ NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE
20
+ LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
21
+ OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
22
+ WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
data/README.md ADDED
@@ -0,0 +1,35 @@
1
+ # FindKeywords
2
+
3
+ Finds keywords in a sentence. Uses a stop word list and a market word list to remove words that are not relevant.
4
+
5
+ ## Installation
6
+
7
+ Add this line to your application's Gemfile:
8
+
9
+ gem 'find_keywords'
10
+
11
+ And then execute:
12
+
13
+ $ bundle
14
+
15
+ Or install it yourself as:
16
+
17
+ $ gem install find_keywords
18
+
19
+ ## Usage
20
+
21
+ FindKeywords takes a string (sentence), a list (array), or a hash and returns only the keywords. It removes the stop words and a list of common marketing words.
22
+
23
+ ```ruby
24
+ sentence = "_the yellow__jeans_"
25
+ keywords = FindKeywords::Keywords.new(sentence).keywords
26
+ keywords => ["yellow", "jeans"]
27
+ ```
28
+
29
+ ## Contributing
30
+
31
+ 1. Fork it ( https://github.com/[my-github-username]/find_keywords/fork )
32
+ 2. Create your feature branch (`git checkout -b my-new-feature`)
33
+ 3. Commit your changes (`git commit -am 'Add some feature'`)
34
+ 4. Push to the branch (`git push origin my-new-feature`)
35
+ 5. Create a new Pull Request
data/Rakefile ADDED
@@ -0,0 +1,2 @@
1
+ require "bundler/gem_tasks"
2
+
@@ -0,0 +1,25 @@
1
+ # coding: utf-8
2
+ lib = File.expand_path('../lib', __FILE__)
3
+ $LOAD_PATH.unshift(lib) unless $LOAD_PATH.include?(lib)
4
+ require 'find_keywords/version'
5
+
6
# Gem packaging metadata for find_keywords.
Gem::Specification.new do |spec|
  spec.name          = "find_keywords"
  spec.version       = FindKeywords::VERSION
  spec.authors       = ["Kirk Jarvis"]
  spec.email         = ["zuuzlo@yahoo.com"]
  spec.summary       = "Finds keywords in a sentence"
  spec.description   = "Finds keywords in a sentence. Uses a stop word list and market word list to remove words that are not relevant."
  spec.homepage      = ""
  spec.license       = "MIT"

  # Package every file tracked by git; -z separates paths with NUL bytes so
  # names containing whitespace survive the split.
  spec.files         = `git ls-files -z`.split("\x0")
  # Anything under bin/ is exposed as an executable, by base name.
  spec.executables   = spec.files.grep(%r{^bin/}) { |f| File.basename(f) }
  spec.test_files    = spec.files.grep(%r{^(test|spec|features)/})
  spec.require_paths = ["lib"]

  # Development-only dependencies; the gem declares no runtime dependencies.
  spec.add_development_dependency "bundler", "~> 1.6"
  spec.add_development_dependency "rake"
  spec.add_development_dependency "rspec"
  spec.add_development_dependency "pry"
end
@@ -0,0 +1,3 @@
1
module FindKeywords
  # Gem version string; read by the gemspec as FindKeywords::VERSION.
  # Frozen so the shared constant cannot be modified in place.
  VERSION = "0.0.1".freeze
end
@@ -0,0 +1,83 @@
1
+ require "find_keywords/version"
2
+
3
# Extracts keywords from free text by dropping stop words, marketing words
# and very short words.
module FindKeywords

  # Common English function words that are never reported as keywords.
  # Left unfrozen so existing callers that extend the list keep working.
  STOP_WORDS = [
    'a','cannot','into','our','thus','about','co','is','ours','to','above',
    'could','it','ourselves','together','across','down','its','out','too',
    'after','during','itself','over','toward','afterwards','each','last','own',
    'towards','again','eg','latter','per','under','against','either','latterly',
    'perhaps','until','all','else','least','rather','up','almost','elsewhere',
    'less','same','upon','alone','enough','ltd','seem','us','along','etc',
    'many','seemed','very','already','even','may','seeming','via','also','ever',
    'me','seems','was','although','every','meanwhile','several','we','always',
    'everyone','might','she','well','among','everything','more','should','were',
    'amongst','everywhere','moreover','since','what','an','except','most','so',
    'whatever','and','few','mostly','some','when','another','first','much',
    'somehow','whence','any','for','must','someone','whenever','anyhow',
    'former','my','something','where','anyone','formerly','myself','sometime',
    'whereafter','anything','from','namely','sometimes','whereas','anywhere',
    'further','neither','somewhere','whereby','are','had','never','still',
    'wherein','around','has','nevertheless','such','whereupon','as','have',
    'next','than','wherever','at','he','no','that','whether','be','hence',
    'nobody','the','whither','became','her','none','their','which','because',
    'here','noone','them','while','become','hereafter','nor','themselves','who',
    'becomes','hereby','not','then','whoever','becoming','herein','nothing',
    'thence','whole','been','hereupon','now','there','whom','before','hers',
    'nowhere','thereafter','whose','beforehand','herself','of','thereby','why',
    'behind','him','off','therefore','will','being','himself','often','therein',
    'with','below','his','on','thereupon','within','beside','how','once',
    'these','without','besides','however','one','they','would','between','i',
    'only','this','yet','beyond','ie','onto','those','you','both','if','or',
    'though','your','but','in','other','through','yours','by','inc','others',
    'throughout','yourself','can','indeed','otherwise','thru','yourselves'
  ]

  # Retail / promotional vocabulary that is also filtered out of the result.
  MARKET_WORDS = [
    'select','styles','shop','reg','orig','set','sets','offer',
    'valid','get','free','shipping','double','december','coupon','save','ends',
    'january','affiliate','exclusive','buy','use','code','size','order',
    'checkout','expires','purchase','just','plus','sales','tax','promo','holiday',
    'delivery','ca','co','ma','mi','oh','ri','online','members','back','points',
    'orders'
  ]

  # Wraps a piece of text and reports the keywords it contains.
  class Keywords

    attr_accessor :sentence

    # sentence - a String (used as is), an Array (elements joined with single
    #            spaces) or a Hash (every key and value interpolated into one
    #            space-separated string). Any other object yields empty text.
    def initialize(sentence)
      @sentence =
        case sentence
        when String then sentence
        when Array  then sentence.join(' ')
        when Hash   then sentence.map { |key, value| "#{key} #{value} " }.join
        else ''
        end
    end

    # Returns an Array of unique, lower-cased keywords in order of first
    # appearance. Words listed in STOP_WORDS or MARKET_WORDS and words of
    # two characters or fewer are left out.
    #
    # The stored sentence is never modified: every substitution builds a new
    # string, so the text handed to the constructor stays intact and frozen
    # strings are accepted.
    def keywords
      # to_s guards against a non-String assigned through the sentence= writer.
      text = @sentence.to_s
      text = text.gsub(/['`]/, '')                          # drop apostrophes and backticks
      text = text.gsub(/\s*@\s*/, ' at ')                   # spell out "@"
      text = text.gsub(/\s*&\s*/, ' and ')                  # spell out "&"
      text = text.gsub(/\s*[^A-Za-z0-9\.\-]\s*/, ' ')       # other punctuation/whitespace -> one space
      text = text.gsub(/[^a-zA-Z ]/, '')                    # digits, dots and hyphens vanish without splitting the word

      candidates = text.downcase.scan(/\w+/)
      kept = candidates.reject do |word|
        word.size <= 2 || STOP_WORDS.include?(word) || MARKET_WORDS.include?(word)
      end
      kept.uniq
    end
  end
end
metadata ADDED
@@ -0,0 +1,109 @@
1
+ --- !ruby/object:Gem::Specification
2
+ name: find_keywords
3
+ version: !ruby/object:Gem::Version
4
+ version: 0.0.1
5
+ platform: ruby
6
+ authors:
7
+ - Kirk Jarvis
8
+ autorequire:
9
+ bindir: bin
10
+ cert_chain: []
11
+ date: 2014-05-31 00:00:00.000000000 Z
12
+ dependencies:
13
+ - !ruby/object:Gem::Dependency
14
+ name: bundler
15
+ requirement: !ruby/object:Gem::Requirement
16
+ requirements:
17
+ - - ~>
18
+ - !ruby/object:Gem::Version
19
+ version: '1.6'
20
+ type: :development
21
+ prerelease: false
22
+ version_requirements: !ruby/object:Gem::Requirement
23
+ requirements:
24
+ - - ~>
25
+ - !ruby/object:Gem::Version
26
+ version: '1.6'
27
+ - !ruby/object:Gem::Dependency
28
+ name: rake
29
+ requirement: !ruby/object:Gem::Requirement
30
+ requirements:
31
+ - - '>='
32
+ - !ruby/object:Gem::Version
33
+ version: '0'
34
+ type: :development
35
+ prerelease: false
36
+ version_requirements: !ruby/object:Gem::Requirement
37
+ requirements:
38
+ - - '>='
39
+ - !ruby/object:Gem::Version
40
+ version: '0'
41
+ - !ruby/object:Gem::Dependency
42
+ name: rspec
43
+ requirement: !ruby/object:Gem::Requirement
44
+ requirements:
45
+ - - '>='
46
+ - !ruby/object:Gem::Version
47
+ version: '0'
48
+ type: :development
49
+ prerelease: false
50
+ version_requirements: !ruby/object:Gem::Requirement
51
+ requirements:
52
+ - - '>='
53
+ - !ruby/object:Gem::Version
54
+ version: '0'
55
+ - !ruby/object:Gem::Dependency
56
+ name: pry
57
+ requirement: !ruby/object:Gem::Requirement
58
+ requirements:
59
+ - - '>='
60
+ - !ruby/object:Gem::Version
61
+ version: '0'
62
+ type: :development
63
+ prerelease: false
64
+ version_requirements: !ruby/object:Gem::Requirement
65
+ requirements:
66
+ - - '>='
67
+ - !ruby/object:Gem::Version
68
+ version: '0'
69
+ description: Finds keywords in a sentence. Uses a stop word list and market word
70
+ list to remove words that are not relevent.
71
+ email:
72
+ - zuuzlo@yahoo.com
73
+ executables: []
74
+ extensions: []
75
+ extra_rdoc_files: []
76
+ files:
77
+ - .gitignore
78
+ - Gemfile
79
+ - LICENSE.txt
80
+ - README.md
81
+ - Rakefile
82
+ - find_keywords.gemspec
83
+ - lib/find_keywords.rb
84
+ - lib/find_keywords/version.rb
85
+ homepage: ''
86
+ licenses:
87
+ - MIT
88
+ metadata: {}
89
+ post_install_message:
90
+ rdoc_options: []
91
+ require_paths:
92
+ - lib
93
+ required_ruby_version: !ruby/object:Gem::Requirement
94
+ requirements:
95
+ - - '>='
96
+ - !ruby/object:Gem::Version
97
+ version: '0'
98
+ required_rubygems_version: !ruby/object:Gem::Requirement
99
+ requirements:
100
+ - - '>='
101
+ - !ruby/object:Gem::Version
102
+ version: '0'
103
+ requirements: []
104
+ rubyforge_project:
105
+ rubygems_version: 2.0.3
106
+ signing_key:
107
+ specification_version: 4
108
+ summary: Finds keywords in a sentence
109
+ test_files: []