bayesic_matching 0.1.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -0,0 +1,3 @@
1
+ class BayesicMatching
2
+ VERSION = "0.1.0"
3
+ end
@@ -0,0 +1,34 @@
1
+ require "bayesic_matching/version"
2
+
3
+ class BayesicMatching
4
+ def initialize
5
+ @classifications = []
6
+ @classifications_by_token = {}
7
+ @tokens_by_classification = {}
8
+ @total_token_entries = 0.0
9
+ end
10
+
11
+ def classify(tokens)
12
+ tokens = tokens.reject{|t| @classifications_by_token[t].nil? }
13
+ tokens.each_with_object({}) do |token, hash|
14
+ @classifications_by_token[token].each do |c|
15
+ p_klass = hash[c] || (1.0 / @classifications.size)
16
+ p_not_klass = 1.0 - p_klass
17
+ p_token_given_klass = 1.0
18
+ p_token_given_not_klass = (@classifications_by_token[token].size - 1) / @classifications.size.to_f
19
+ hash[c] = (p_token_given_klass * p_klass) / ((p_token_given_klass * p_klass) + (p_token_given_not_klass * p_not_klass))
20
+ end
21
+ end
22
+ end
23
+
24
+ def train(tokens, classification)
25
+ @classifications << classification
26
+ @tokens_by_classification[classification] ||= []
27
+ @tokens_by_classification[classification].concat(tokens)
28
+ tokens.each do |token|
29
+ @classifications_by_token[token] ||= []
30
+ @classifications_by_token[token] << classification
31
+ @total_token_entries += 1.0
32
+ end
33
+ end
34
+ end
metadata ADDED
@@ -0,0 +1,116 @@
1
+ --- !ruby/object:Gem::Specification
2
+ name: bayesic_matching
3
+ version: !ruby/object:Gem::Version
4
+ version: 0.1.0
5
+ platform: ruby
6
+ authors:
7
+ - Michael Ries
8
+ autorequire:
9
+ bindir: exe
10
+ cert_chain: []
11
+ date: 2017-12-14 00:00:00.000000000 Z
12
+ dependencies:
13
+ - !ruby/object:Gem::Dependency
14
+ name: benchmark-ips
15
+ requirement: !ruby/object:Gem::Requirement
16
+ requirements:
17
+ - - "~>"
18
+ - !ruby/object:Gem::Version
19
+ version: '2.7'
20
+ type: :development
21
+ prerelease: false
22
+ version_requirements: !ruby/object:Gem::Requirement
23
+ requirements:
24
+ - - "~>"
25
+ - !ruby/object:Gem::Version
26
+ version: '2.7'
27
+ - !ruby/object:Gem::Dependency
28
+ name: bundler
29
+ requirement: !ruby/object:Gem::Requirement
30
+ requirements:
31
+ - - "~>"
32
+ - !ruby/object:Gem::Version
33
+ version: '1.16'
34
+ type: :development
35
+ prerelease: false
36
+ version_requirements: !ruby/object:Gem::Requirement
37
+ requirements:
38
+ - - "~>"
39
+ - !ruby/object:Gem::Version
40
+ version: '1.16'
41
+ - !ruby/object:Gem::Dependency
42
+ name: rake
43
+ requirement: !ruby/object:Gem::Requirement
44
+ requirements:
45
+ - - "~>"
46
+ - !ruby/object:Gem::Version
47
+ version: '10.0'
48
+ type: :development
49
+ prerelease: false
50
+ version_requirements: !ruby/object:Gem::Requirement
51
+ requirements:
52
+ - - "~>"
53
+ - !ruby/object:Gem::Version
54
+ version: '10.0'
55
+ - !ruby/object:Gem::Dependency
56
+ name: rspec
57
+ requirement: !ruby/object:Gem::Requirement
58
+ requirements:
59
+ - - "~>"
60
+ - !ruby/object:Gem::Version
61
+ version: '3.0'
62
+ type: :development
63
+ prerelease: false
64
+ version_requirements: !ruby/object:Gem::Requirement
65
+ requirements:
66
+ - - "~>"
67
+ - !ruby/object:Gem::Version
68
+ version: '3.0'
69
+ description: bayesian approach to matching one list of strings with another
70
+ email:
71
+ - michael@riesd.com
72
+ executables: []
73
+ extensions: []
74
+ extra_rdoc_files: []
75
+ files:
76
+ - ".gitignore"
77
+ - ".rspec"
78
+ - ".travis.yml"
79
+ - Gemfile
80
+ - Gemfile.lock
81
+ - LICENSE.txt
82
+ - README.md
83
+ - Rakefile
84
+ - bayesic_matching.gemspec
85
+ - bin/console
86
+ - bin/setup
87
+ - examples/benchmark.rb
88
+ - examples/favorite_recent_movies.csv
89
+ - examples/popular_recent_movies.csv
90
+ - lib/bayesic_matching.rb
91
+ - lib/bayesic_matching/version.rb
92
+ homepage: https://github.com/mmmries/bayesic_matching
93
+ licenses:
94
+ - MIT
95
+ metadata: {}
96
+ post_install_message:
97
+ rdoc_options: []
98
+ require_paths:
99
+ - lib
100
+ required_ruby_version: !ruby/object:Gem::Requirement
101
+ requirements:
102
+ - - ">="
103
+ - !ruby/object:Gem::Version
104
+ version: '0'
105
+ required_rubygems_version: !ruby/object:Gem::Requirement
106
+ requirements:
107
+ - - ">="
108
+ - !ruby/object:Gem::Version
109
+ version: '0'
110
+ requirements: []
111
+ rubyforge_project:
112
+ rubygems_version: 2.6.14
113
+ signing_key:
114
+ specification_version: 4
115
+ summary: bayesian approach to matching one list of strings with another
116
+ test_files: []