classifier 1.3.0 → 1.3.1

Sign up to get free protection for your applications and to get access to all the features.
Files changed (87) hide show
  1. data/README +2 -1
  2. data/Rakefile +3 -4
  3. data/bin/bayes.rb +1 -1
  4. data/bin/summarize.rb +7 -2
  5. data/lib/classifier/extensions/string.rb +2 -2
  6. data/lib/classifier/extensions/vector_serialize.rb +2 -2
  7. data/lib/classifier/lsi.rb +2 -2
  8. data/lib/classifier/lsi/content_node.rb +1 -1
  9. metadata +73 -159
  10. data/doc/classes/Array.html +0 -139
  11. data/doc/classes/Array.src/M000003.html +0 -18
  12. data/doc/classes/Classifier.html +0 -140
  13. data/doc/classes/Classifier/Bayes.html +0 -317
  14. data/doc/classes/Classifier/Bayes.src/M000038.html +0 -20
  15. data/doc/classes/Classifier/Bayes.src/M000039.html +0 -23
  16. data/doc/classes/Classifier/Bayes.src/M000040.html +0 -30
  17. data/doc/classes/Classifier/Bayes.src/M000041.html +0 -27
  18. data/doc/classes/Classifier/Bayes.src/M000042.html +0 -18
  19. data/doc/classes/Classifier/Bayes.src/M000043.html +0 -25
  20. data/doc/classes/Classifier/Bayes.src/M000044.html +0 -18
  21. data/doc/classes/Classifier/ContentNode.html +0 -247
  22. data/doc/classes/Classifier/ContentNode.src/M000046.html +0 -19
  23. data/doc/classes/Classifier/ContentNode.src/M000047.html +0 -18
  24. data/doc/classes/Classifier/ContentNode.src/M000048.html +0 -18
  25. data/doc/classes/Classifier/ContentNode.src/M000049.html +0 -49
  26. data/doc/classes/Classifier/LSI.html +0 -539
  27. data/doc/classes/Classifier/LSI.src/M000022.html +0 -20
  28. data/doc/classes/Classifier/LSI.src/M000023.html +0 -18
  29. data/doc/classes/Classifier/LSI.src/M000024.html +0 -21
  30. data/doc/classes/Classifier/LSI.src/M000025.html +0 -18
  31. data/doc/classes/Classifier/LSI.src/M000026.html +0 -19
  32. data/doc/classes/Classifier/LSI.src/M000027.html +0 -21
  33. data/doc/classes/Classifier/LSI.src/M000028.html +0 -18
  34. data/doc/classes/Classifier/LSI.src/M000029.html +0 -19
  35. data/doc/classes/Classifier/LSI.src/M000030.html +0 -43
  36. data/doc/classes/Classifier/LSI.src/M000031.html +0 -23
  37. data/doc/classes/Classifier/LSI.src/M000032.html +0 -30
  38. data/doc/classes/Classifier/LSI.src/M000033.html +0 -30
  39. data/doc/classes/Classifier/LSI.src/M000034.html +0 -21
  40. data/doc/classes/Classifier/LSI.src/M000035.html +0 -21
  41. data/doc/classes/Classifier/LSI.src/M000036.html +0 -31
  42. data/doc/classes/Classifier/LSI.src/M000037.html +0 -21
  43. data/doc/classes/Classifier/WordList.html +0 -217
  44. data/doc/classes/Classifier/WordList.src/M000017.html +0 -18
  45. data/doc/classes/Classifier/WordList.src/M000018.html +0 -19
  46. data/doc/classes/Classifier/WordList.src/M000019.html +0 -19
  47. data/doc/classes/Classifier/WordList.src/M000020.html +0 -18
  48. data/doc/classes/Classifier/WordList.src/M000021.html +0 -18
  49. data/doc/classes/GSL.html +0 -112
  50. data/doc/classes/GSL/Matrix.html +0 -126
  51. data/doc/classes/GSL/Vector.html +0 -156
  52. data/doc/classes/GSL/Vector.src/M000015.html +0 -18
  53. data/doc/classes/GSL/Vector.src/M000016.html +0 -19
  54. data/doc/classes/Matrix.html +0 -184
  55. data/doc/classes/Matrix.src/M000004.html +0 -18
  56. data/doc/classes/Matrix.src/M000005.html +0 -76
  57. data/doc/classes/Matrix.src/M000006.html +0 -18
  58. data/doc/classes/Object.html +0 -139
  59. data/doc/classes/Object.src/M000007.html +0 -16
  60. data/doc/classes/String.html +0 -275
  61. data/doc/classes/String.src/M000008.html +0 -18
  62. data/doc/classes/String.src/M000009.html +0 -18
  63. data/doc/classes/String.src/M000010.html +0 -18
  64. data/doc/classes/String.src/M000011.html +0 -18
  65. data/doc/classes/String.src/M000012.html +0 -18
  66. data/doc/classes/String.src/M000013.html +0 -18
  67. data/doc/classes/String.src/M000014.html +0 -18
  68. data/doc/classes/Vector.html +0 -154
  69. data/doc/classes/Vector.src/M000001.html +0 -22
  70. data/doc/classes/Vector.src/M000002.html +0 -25
  71. data/doc/created.rid +0 -1
  72. data/doc/files/README.html +0 -252
  73. data/doc/files/lib/classifier/bayes_rb.html +0 -115
  74. data/doc/files/lib/classifier/extensions/string_rb.html +0 -122
  75. data/doc/files/lib/classifier/extensions/vector_rb.html +0 -120
  76. data/doc/files/lib/classifier/extensions/vector_serialize_rb.html +0 -101
  77. data/doc/files/lib/classifier/extensions/word_hash_rb.html +0 -115
  78. data/doc/files/lib/classifier/lsi/content_node_rb.html +0 -115
  79. data/doc/files/lib/classifier/lsi/summary_rb.html +0 -115
  80. data/doc/files/lib/classifier/lsi/word_list_rb.html +0 -115
  81. data/doc/files/lib/classifier/lsi_rb.html +0 -127
  82. data/doc/files/lib/classifier_rb.html +0 -125
  83. data/doc/fr_class_index.html +0 -39
  84. data/doc/fr_file_index.html +0 -37
  85. data/doc/fr_method_index.html +0 -75
  86. data/doc/index.html +0 -24
  87. data/doc/rdoc-style.css +0 -208
@@ -1,18 +0,0 @@
1
- <?xml version="1.0" encoding="iso-8859-1"?>
2
- <!DOCTYPE html
3
- PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
4
- "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
5
-
6
- <html>
7
- <head>
8
- <title>sum (Array)</title>
9
- <meta http-equiv="Content-Type" content="text/html; charset=iso-8859-1" />
10
- <link rel="stylesheet" href="../.././rdoc-style.css" type="text/css" media="screen" />
11
- </head>
12
- <body class="standalone-code">
13
- <pre><span class="ruby-comment cmt"># File lib/classifier/extensions/vector.rb, line 10</span>
14
- <span class="ruby-keyword kw">def</span> <span class="ruby-identifier">sum</span>
15
- <span class="ruby-identifier">inject</span>(<span class="ruby-value">0</span>) { <span class="ruby-operator">|</span><span class="ruby-identifier">sum</span>,<span class="ruby-identifier">term</span><span class="ruby-operator">|</span> <span class="ruby-identifier">sum</span> <span class="ruby-operator">+=</span> <span class="ruby-identifier">term</span> }.<span class="ruby-identifier">to_f</span>
16
- <span class="ruby-keyword kw">end</span></pre>
17
- </body>
18
- </html>
@@ -1,140 +0,0 @@
1
- <?xml version="1.0" encoding="iso-8859-1"?>
2
- <!DOCTYPE html
3
- PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
4
- "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
5
-
6
- <html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
7
- <head>
8
- <title>Module: Classifier</title>
9
- <meta http-equiv="Content-Type" content="text/html; charset=iso-8859-1" />
10
- <meta http-equiv="Content-Script-Type" content="text/javascript" />
11
- <link rel="stylesheet" href=".././rdoc-style.css" type="text/css" media="screen" />
12
- <script type="text/javascript">
13
- // <![CDATA[
14
-
15
- function popupCode( url ) {
16
- window.open(url, "Code", "resizable=yes,scrollbars=yes,toolbar=no,status=no,height=150,width=400")
17
- }
18
-
19
- function toggleCode( id ) {
20
- if ( document.getElementById )
21
- elem = document.getElementById( id );
22
- else if ( document.all )
23
- elem = eval( "document.all." + id );
24
- else
25
- return false;
26
-
27
- elemStyle = elem.style;
28
-
29
- if ( elemStyle.display != "block" ) {
30
- elemStyle.display = "block"
31
- } else {
32
- elemStyle.display = "none"
33
- }
34
-
35
- return true;
36
- }
37
-
38
- // Make codeblocks hidden by default
39
- document.writeln( "<style type=\"text/css\">div.method-source-code { display: none }</style>" )
40
-
41
- // ]]>
42
- </script>
43
-
44
- </head>
45
- <body>
46
-
47
-
48
-
49
- <div id="classHeader">
50
- <table class="header-table">
51
- <tr class="top-aligned-row">
52
- <td><strong>Module</strong></td>
53
- <td class="class-name-in-header">Classifier</td>
54
- </tr>
55
- <tr class="top-aligned-row">
56
- <td><strong>In:</strong></td>
57
- <td>
58
- <a href="../files/lib/classifier/bayes_rb.html">
59
- lib/classifier/bayes.rb
60
- </a>
61
- <br />
62
- <a href="../files/lib/classifier/lsi_rb.html">
63
- lib/classifier/lsi.rb
64
- </a>
65
- <br />
66
- <a href="../files/lib/classifier/lsi/content_node_rb.html">
67
- lib/classifier/lsi/content_node.rb
68
- </a>
69
- <br />
70
- <a href="../files/lib/classifier/lsi/word_list_rb.html">
71
- lib/classifier/lsi/word_list.rb
72
- </a>
73
- <br />
74
- </td>
75
- </tr>
76
-
77
- </table>
78
- </div>
79
- <!-- banner header -->
80
-
81
- <div id="bodyContent">
82
-
83
-
84
-
85
- <div id="contextContent">
86
-
87
- <div id="description">
88
- <table>
89
- <tr><td valign="top">Author:</td><td>David Fayram (<a href="mailto:dfayram@lensmen.net">dfayram@lensmen.net</a>)
90
-
91
- </td></tr>
92
- <tr><td valign="top">Copyright:</td><td>Copyright &#169; 2005 David Fayram II
93
-
94
- </td></tr>
95
- <tr><td valign="top">License:</td><td>LGPL
96
-
97
- </td></tr>
98
- </table>
99
-
100
- </div>
101
-
102
-
103
- </div>
104
-
105
-
106
- </div>
107
-
108
-
109
- <!-- if includes -->
110
-
111
- <div id="section">
112
-
113
- <div id="class-list">
114
- <h3 class="section-bar">Classes and Modules</h3>
115
-
116
- Class <a href="Classifier/Bayes.html" class="link">Classifier::Bayes</a><br />
117
- Class <a href="Classifier/ContentNode.html" class="link">Classifier::ContentNode</a><br />
118
- Class <a href="Classifier/LSI.html" class="link">Classifier::LSI</a><br />
119
- Class <a href="Classifier/WordList.html" class="link">Classifier::WordList</a><br />
120
-
121
- </div>
122
-
123
-
124
-
125
-
126
-
127
-
128
-
129
- <!-- if method_list -->
130
-
131
-
132
- </div>
133
-
134
-
135
- <div id="validator-badges">
136
- <p><small><a href="http://validator.w3.org/check/referer">[Validate]</a></small></p>
137
- </div>
138
-
139
- </body>
140
- </html>
@@ -1,317 +0,0 @@
1
- <?xml version="1.0" encoding="iso-8859-1"?>
2
- <!DOCTYPE html
3
- PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
4
- "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
5
-
6
- <html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
7
- <head>
8
- <title>Class: Classifier::Bayes</title>
9
- <meta http-equiv="Content-Type" content="text/html; charset=iso-8859-1" />
10
- <meta http-equiv="Content-Script-Type" content="text/javascript" />
11
- <link rel="stylesheet" href="../.././rdoc-style.css" type="text/css" media="screen" />
12
- <script type="text/javascript">
13
- // <![CDATA[
14
-
15
- function popupCode( url ) {
16
- window.open(url, "Code", "resizable=yes,scrollbars=yes,toolbar=no,status=no,height=150,width=400")
17
- }
18
-
19
- function toggleCode( id ) {
20
- if ( document.getElementById )
21
- elem = document.getElementById( id );
22
- else if ( document.all )
23
- elem = eval( "document.all." + id );
24
- else
25
- return false;
26
-
27
- elemStyle = elem.style;
28
-
29
- if ( elemStyle.display != "block" ) {
30
- elemStyle.display = "block"
31
- } else {
32
- elemStyle.display = "none"
33
- }
34
-
35
- return true;
36
- }
37
-
38
- // Make codeblocks hidden by default
39
- document.writeln( "<style type=\"text/css\">div.method-source-code { display: none }</style>" )
40
-
41
- // ]]>
42
- </script>
43
-
44
- </head>
45
- <body>
46
-
47
-
48
-
49
- <div id="classHeader">
50
- <table class="header-table">
51
- <tr class="top-aligned-row">
52
- <td><strong>Class</strong></td>
53
- <td class="class-name-in-header">Classifier::Bayes</td>
54
- </tr>
55
- <tr class="top-aligned-row">
56
- <td><strong>In:</strong></td>
57
- <td>
58
- <a href="../../files/lib/classifier/bayes_rb.html">
59
- lib/classifier/bayes.rb
60
- </a>
61
- <br />
62
- </td>
63
- </tr>
64
-
65
- <tr class="top-aligned-row">
66
- <td><strong>Parent:</strong></td>
67
- <td>
68
- <a href="../Object.html">
69
- Object
70
- </a>
71
- </td>
72
- </tr>
73
- </table>
74
- </div>
75
- <!-- banner header -->
76
-
77
- <div id="bodyContent">
78
-
79
-
80
-
81
- <div id="contextContent">
82
-
83
-
84
-
85
- </div>
86
-
87
- <div id="method-list">
88
- <h3 class="section-bar">Methods</h3>
89
-
90
- <div class="name-list">
91
- <a href="#M000044">add_category</a>&nbsp;&nbsp;
92
- <a href="#M000045">append_category</a>&nbsp;&nbsp;
93
- <a href="#M000041">classifications</a>&nbsp;&nbsp;
94
- <a href="#M000042">classify</a>&nbsp;&nbsp;
95
- <a href="#M000043">method_missing</a>&nbsp;&nbsp;
96
- <a href="#M000038">new</a>&nbsp;&nbsp;
97
- <a href="#M000039">train</a>&nbsp;&nbsp;
98
- <a href="#M000040">untrain</a>&nbsp;&nbsp;
99
- </div>
100
- </div>
101
-
102
- </div>
103
-
104
-
105
- <!-- if includes -->
106
-
107
- <div id="section">
108
-
109
-
110
-
111
-
112
-
113
-
114
-
115
-
116
- <!-- if method_list -->
117
- <div id="methods">
118
- <h3 class="section-bar">Public Class methods</h3>
119
-
120
- <div id="method-M000038" class="method-detail">
121
- <a name="M000038"></a>
122
-
123
- <div class="method-heading">
124
- <a href="Bayes.src/M000038.html" target="Code" class="method-signature"
125
- onclick="popupCode('Bayes.src/M000038.html');return false;">
126
- <span class="method-name">new</span><span class="method-args">(*categories)</span>
127
- </a>
128
- </div>
129
-
130
- <div class="method-description">
131
- <p>
132
- The class can be created with one or more categories, each of which will be
133
- initialized and given a training method. E.g.,
134
- </p>
135
- <pre>
136
- b = Classifier::Bayes.new 'Interesting', 'Uninteresting', 'Spam'
137
- </pre>
138
- </div>
139
- </div>
140
-
141
- <h3 class="section-bar">Public Instance methods</h3>
142
-
143
- <div id="method-M000044" class="method-detail">
144
- <a name="M000044"></a>
145
-
146
- <div class="method-heading">
147
- <a href="Bayes.src/M000044.html" target="Code" class="method-signature"
148
- onclick="popupCode('Bayes.src/M000044.html');return false;">
149
- <span class="method-name">add_category</span><span class="method-args">(category)</span>
150
- </a>
151
- </div>
152
-
153
- <div class="method-description">
154
- <p>
155
- Allows you to add categories to the classifier. For example:
156
- </p>
157
- <pre>
158
- b.add_category &quot;Not spam&quot;
159
- </pre>
160
- <p>
161
- WARNING: Adding categories to a trained classifier will result in an
162
- undertrained category that will tend to match more criteria than the
163
- trained selective categories. In short, try to initialize your categories
164
- at initialization.
165
- </p>
166
- </div>
167
- </div>
168
-
169
- <div id="method-M000045" class="method-detail">
170
- <a name="M000045"></a>
171
-
172
- <div class="method-heading">
173
- <span class="method-name">append_category</span><span class="method-args">(category)</span>
174
- </div>
175
-
176
- <div class="method-description">
177
- <p>
178
- Alias for <a href="Bayes.html#M000044">add_category</a>
179
- </p>
180
- </div>
181
- </div>
182
-
183
- <div id="method-M000041" class="method-detail">
184
- <a name="M000041"></a>
185
-
186
- <div class="method-heading">
187
- <a href="Bayes.src/M000041.html" target="Code" class="method-signature"
188
- onclick="popupCode('Bayes.src/M000041.html');return false;">
189
- <span class="method-name">classifications</span><span class="method-args">(text)</span>
190
- </a>
191
- </div>
192
-
193
- <div class="method-description">
194
- <p>
195
- Returns the scores in each category the provided <tt>text</tt>. E.g.,
196
- </p>
197
- <pre>
198
- b.classifications &quot;I hate bad words and you&quot;
199
- =&gt; {&quot;Uninteresting&quot;=&gt;-12.6997928013932, &quot;Interesting&quot;=&gt;-18.4206807439524}
200
- </pre>
201
- <p>
202
- The largest of these scores (the one closest to 0) is the one picked out by
203
- <a href="Bayes.html#M000042">classify</a>
204
- </p>
205
- </div>
206
- </div>
207
-
208
- <div id="method-M000042" class="method-detail">
209
- <a name="M000042"></a>
210
-
211
- <div class="method-heading">
212
- <a href="Bayes.src/M000042.html" target="Code" class="method-signature"
213
- onclick="popupCode('Bayes.src/M000042.html');return false;">
214
- <span class="method-name">classify</span><span class="method-args">(text)</span>
215
- </a>
216
- </div>
217
-
218
- <div class="method-description">
219
- <p>
220
- Returns the classification of the provided <tt>text</tt>, which is one of
221
- the categories given in the initializer. E.g.,
222
- </p>
223
- <pre>
224
- b.classify &quot;I hate bad words and you&quot;
225
- =&gt; 'Uninteresting'
226
- </pre>
227
- </div>
228
- </div>
229
-
230
- <div id="method-M000043" class="method-detail">
231
- <a name="M000043"></a>
232
-
233
- <div class="method-heading">
234
- <a href="Bayes.src/M000043.html" target="Code" class="method-signature"
235
- onclick="popupCode('Bayes.src/M000043.html');return false;">
236
- <span class="method-name">method_missing</span><span class="method-args">(name, *args)</span>
237
- </a>
238
- </div>
239
-
240
- <div class="method-description">
241
- <p>
242
- Provides training and untraining methods for the categories specified in <a
243
- href="Bayes.html#M000038">Bayes#new</a> For example:
244
- </p>
245
- <pre>
246
- b = Classifier::Bayes.new 'This', 'That', 'the_other'
247
- b.train_this &quot;This text&quot;
248
- b.train_that &quot;That text&quot;
249
- b.untrain_that &quot;That text&quot;
250
- b.train_the_other &quot;The other text&quot;
251
- </pre>
252
- </div>
253
- </div>
254
-
255
- <div id="method-M000039" class="method-detail">
256
- <a name="M000039"></a>
257
-
258
- <div class="method-heading">
259
- <a href="Bayes.src/M000039.html" target="Code" class="method-signature"
260
- onclick="popupCode('Bayes.src/M000039.html');return false;">
261
- <span class="method-name">train</span><span class="method-args">(category, text)</span>
262
- </a>
263
- </div>
264
-
265
- <div class="method-description">
266
- <p>
267
- Provides a general training method for all categories specified in <a
268
- href="Bayes.html#M000038">Bayes#new</a> For example:
269
- </p>
270
- <pre>
271
- b = Classifier::Bayes.new 'This', 'That', 'the_other'
272
- b.train :this, &quot;This text&quot;
273
- b.train &quot;that&quot;, &quot;That text&quot;
274
- b.train &quot;The other&quot;, &quot;The other text&quot;
275
- </pre>
276
- </div>
277
- </div>
278
-
279
- <div id="method-M000040" class="method-detail">
280
- <a name="M000040"></a>
281
-
282
- <div class="method-heading">
283
- <a href="Bayes.src/M000040.html" target="Code" class="method-signature"
284
- onclick="popupCode('Bayes.src/M000040.html');return false;">
285
- <span class="method-name">untrain</span><span class="method-args">(category, text)</span>
286
- </a>
287
- </div>
288
-
289
- <div class="method-description">
290
- <p>
291
- Provides a untraining method for all categories specified in <a
292
- href="Bayes.html#M000038">Bayes#new</a> Be very careful with this method.
293
- </p>
294
- <p>
295
- For example:
296
- </p>
297
- <pre>
298
- b = Classifier::Bayes.new 'This', 'That', 'the_other'
299
- b.train :this, &quot;This text&quot;
300
- b.untrain :this, &quot;This text&quot;
301
- </pre>
302
- </div>
303
- </div>
304
-
305
-
306
- </div>
307
-
308
-
309
- </div>
310
-
311
-
312
- <div id="validator-badges">
313
- <p><small><a href="http://validator.w3.org/check/referer">[Validate]</a></small></p>
314
- </div>
315
-
316
- </body>
317
- </html>