ocarina 0.0.1

Sign up to get free protection for your applications and to get access to all the features.
Files changed (153) hide show
  1. data/.gitignore +23 -0
  2. data/Gemfile +4 -0
  3. data/LICENSE +204 -0
  4. data/NOTICE +13 -0
  5. data/README.md +83 -0
  6. data/Rakefile +146 -0
  7. data/data/.gitkeep +0 -0
  8. data/data/images/letterpress/board1.png +0 -0
  9. data/data/images/letterpress/board2.png +0 -0
  10. data/data/images/letterpress/board3.png +0 -0
  11. data/data/images/letterpress/board4.png +0 -0
  12. data/data/images/letterpress/board5.png +0 -0
  13. data/data/images/noise/.gitkeep +0 -0
  14. data/data/images/noise/0.gif +0 -0
  15. data/data/images/noise/1.gif +0 -0
  16. data/data/images/noise/2.gif +0 -0
  17. data/data/images/noise/3.gif +0 -0
  18. data/data/images/noise/4.gif +0 -0
  19. data/data/images/noise/5.gif +0 -0
  20. data/data/images/noise/6.gif +0 -0
  21. data/data/images/noise/7.gif +0 -0
  22. data/data/images/noise/8.gif +0 -0
  23. data/data/images/noise/9.gif +0 -0
  24. data/data/images/noise/A.gif +0 -0
  25. data/data/images/noise/B.gif +0 -0
  26. data/data/images/noise/C.gif +0 -0
  27. data/data/images/noise/D.gif +0 -0
  28. data/data/images/noise/E.gif +0 -0
  29. data/data/images/noise/F.gif +0 -0
  30. data/data/images/noise/G.gif +0 -0
  31. data/data/images/noise/H.gif +0 -0
  32. data/data/images/noise/I.gif +0 -0
  33. data/data/images/noise/J.gif +0 -0
  34. data/data/images/noise/K.gif +0 -0
  35. data/data/images/noise/L.gif +0 -0
  36. data/data/images/noise/M.gif +0 -0
  37. data/data/images/noise/N.gif +0 -0
  38. data/data/images/noise/O.gif +0 -0
  39. data/data/images/noise/P.gif +0 -0
  40. data/data/images/noise/Q.gif +0 -0
  41. data/data/images/noise/R.gif +0 -0
  42. data/data/images/noise/S.gif +0 -0
  43. data/data/images/noise/T.gif +0 -0
  44. data/data/images/noise/U.gif +0 -0
  45. data/data/images/noise/V.gif +0 -0
  46. data/data/images/noise/W.gif +0 -0
  47. data/data/images/noise/X.gif +0 -0
  48. data/data/images/noise/Y.gif +0 -0
  49. data/data/images/noise/Z.gif +0 -0
  50. data/data/images/noise/a_lower.gif +0 -0
  51. data/data/images/noise/b_lower.gif +0 -0
  52. data/data/images/noise/c_lower.gif +0 -0
  53. data/data/images/noise/d_lower.gif +0 -0
  54. data/data/images/noise/e_lower.gif +0 -0
  55. data/data/images/noise/f_lower.gif +0 -0
  56. data/data/images/noise/g_lower.gif +0 -0
  57. data/data/images/noise/h_lower.gif +0 -0
  58. data/data/images/noise/i_lower.gif +0 -0
  59. data/data/images/noise/j_lower.gif +0 -0
  60. data/data/images/noise/k_lower.gif +0 -0
  61. data/data/images/noise/l_lower.gif +0 -0
  62. data/data/images/noise/m_lower.gif +0 -0
  63. data/data/images/noise/n_lower.gif +0 -0
  64. data/data/images/noise/o_lower.gif +0 -0
  65. data/data/images/noise/p_lower.gif +0 -0
  66. data/data/images/noise/q_lower.gif +0 -0
  67. data/data/images/noise/r_lower.gif +0 -0
  68. data/data/images/noise/s_lower.gif +0 -0
  69. data/data/images/noise/t_lower.gif +0 -0
  70. data/data/images/noise/u_lower.gif +0 -0
  71. data/data/images/noise/v_lower.gif +0 -0
  72. data/data/images/noise/w_lower.gif +0 -0
  73. data/data/images/noise/x_lower.gif +0 -0
  74. data/data/images/noise/y_lower.gif +0 -0
  75. data/data/images/noise/z_lower.gif +0 -0
  76. data/data/images/reference/.gitkeep +0 -0
  77. data/data/images/reference/0.gif +0 -0
  78. data/data/images/reference/1.gif +0 -0
  79. data/data/images/reference/2.gif +0 -0
  80. data/data/images/reference/3.gif +0 -0
  81. data/data/images/reference/4.gif +0 -0
  82. data/data/images/reference/5.gif +0 -0
  83. data/data/images/reference/6.gif +0 -0
  84. data/data/images/reference/7.gif +0 -0
  85. data/data/images/reference/8.gif +0 -0
  86. data/data/images/reference/9.gif +0 -0
  87. data/data/images/reference/A.gif +0 -0
  88. data/data/images/reference/B.gif +0 -0
  89. data/data/images/reference/C.gif +0 -0
  90. data/data/images/reference/D.gif +0 -0
  91. data/data/images/reference/E.gif +0 -0
  92. data/data/images/reference/F.gif +0 -0
  93. data/data/images/reference/G.gif +0 -0
  94. data/data/images/reference/H.gif +0 -0
  95. data/data/images/reference/I.gif +0 -0
  96. data/data/images/reference/J.gif +0 -0
  97. data/data/images/reference/K.gif +0 -0
  98. data/data/images/reference/L.gif +0 -0
  99. data/data/images/reference/M.gif +0 -0
  100. data/data/images/reference/N.gif +0 -0
  101. data/data/images/reference/O.gif +0 -0
  102. data/data/images/reference/P.gif +0 -0
  103. data/data/images/reference/Q.gif +0 -0
  104. data/data/images/reference/R.gif +0 -0
  105. data/data/images/reference/S.gif +0 -0
  106. data/data/images/reference/T.gif +0 -0
  107. data/data/images/reference/U.gif +0 -0
  108. data/data/images/reference/V.gif +0 -0
  109. data/data/images/reference/W.gif +0 -0
  110. data/data/images/reference/X.gif +0 -0
  111. data/data/images/reference/Y.gif +0 -0
  112. data/data/images/reference/Z.gif +0 -0
  113. data/data/images/reference/a_lower.gif +0 -0
  114. data/data/images/reference/b_lower.gif +0 -0
  115. data/data/images/reference/c_lower.gif +0 -0
  116. data/data/images/reference/d_lower.gif +0 -0
  117. data/data/images/reference/e_lower.gif +0 -0
  118. data/data/images/reference/f_lower.gif +0 -0
  119. data/data/images/reference/g_lower.gif +0 -0
  120. data/data/images/reference/h_lower.gif +0 -0
  121. data/data/images/reference/i_lower.gif +0 -0
  122. data/data/images/reference/j_lower.gif +0 -0
  123. data/data/images/reference/k_lower.gif +0 -0
  124. data/data/images/reference/l_lower.gif +0 -0
  125. data/data/images/reference/m_lower.gif +0 -0
  126. data/data/images/reference/n_lower.gif +0 -0
  127. data/data/images/reference/o_lower.gif +0 -0
  128. data/data/images/reference/p_lower.gif +0 -0
  129. data/data/images/reference/q_lower.gif +0 -0
  130. data/data/images/reference/r_lower.gif +0 -0
  131. data/data/images/reference/s_lower.gif +0 -0
  132. data/data/images/reference/t_lower.gif +0 -0
  133. data/data/images/reference/u_lower.gif +0 -0
  134. data/data/images/reference/v_lower.gif +0 -0
  135. data/data/images/reference/w_lower.gif +0 -0
  136. data/data/images/reference/x_lower.gif +0 -0
  137. data/data/images/reference/y_lower.gif +0 -0
  138. data/data/images/reference/z_lower.gif +0 -0
  139. data/data/letterpress-train.bin +0 -0
  140. data/data/train.bin +0 -0
  141. data/lib/ocarina.rb +12 -0
  142. data/lib/ocarina/character_generator.rb +87 -0
  143. data/lib/ocarina/config.rb +35 -0
  144. data/lib/ocarina/error_stats.rb +62 -0
  145. data/lib/ocarina/letterpress_character_generator.rb +93 -0
  146. data/lib/ocarina/letterpress_cropper.rb +84 -0
  147. data/lib/ocarina/network.rb +264 -0
  148. data/lib/ocarina/util.rb +92 -0
  149. data/lib/ocarina/version.rb +3 -0
  150. data/ocarina.gemspec +20 -0
  151. data/ocarina.png +0 -0
  152. data/test/test_letterpress.rb +60 -0
  153. metadata +231 -0
data/.gitignore ADDED
@@ -0,0 +1,23 @@
1
+ *.gem
2
+ *.rbc
3
+ .bundle
4
+ .config
5
+ .yardoc
6
+ Gemfile.lock
7
+ InstalledFiles
8
+ _yardoc
9
+ coverage
10
+ doc/
11
+ lib/bundler/man
12
+ pkg
13
+ rdoc
14
+ spec/reports
15
+ test/tmp
16
+ test/version_tmp
17
+ tmp
18
+
19
+ # Intellij IDEA project dir
20
+ .idea/
21
+
22
+ # Intellij IDEA project file
23
+ *.iml
data/Gemfile ADDED
@@ -0,0 +1,4 @@
1
+ source 'https://rubygems.org'
2
+
3
+ # Specify your gem's dependencies in ocarina.gemspec
4
+ gemspec
data/LICENSE ADDED
@@ -0,0 +1,204 @@
1
+ Copyright (c) 2012 George Armhold
2
+
3
+
4
+ Apache License
5
+ Version 2.0, January 2004
6
+ http://www.apache.org/licenses/
7
+
8
+ TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION
9
+
10
+ 1. Definitions.
11
+
12
+ "License" shall mean the terms and conditions for use, reproduction,
13
+ and distribution as defined by Sections 1 through 9 of this document.
14
+
15
+ "Licensor" shall mean the copyright owner or entity authorized by
16
+ the copyright owner that is granting the License.
17
+
18
+ "Legal Entity" shall mean the union of the acting entity and all
19
+ other entities that control, are controlled by, or are under common
20
+ control with that entity. For the purposes of this definition,
21
+ "control" means (i) the power, direct or indirect, to cause the
22
+ direction or management of such entity, whether by contract or
23
+ otherwise, or (ii) ownership of fifty percent (50%) or more of the
24
+ outstanding shares, or (iii) beneficial ownership of such entity.
25
+
26
+ "You" (or "Your") shall mean an individual or Legal Entity
27
+ exercising permissions granted by this License.
28
+
29
+ "Source" form shall mean the preferred form for making modifications,
30
+ including but not limited to software source code, documentation
31
+ source, and configuration files.
32
+
33
+ "Object" form shall mean any form resulting from mechanical
34
+ transformation or translation of a Source form, including but
35
+ not limited to compiled object code, generated documentation,
36
+ and conversions to other media types.
37
+
38
+ "Work" shall mean the work of authorship, whether in Source or
39
+ Object form, made available under the License, as indicated by a
40
+ copyright notice that is included in or attached to the work
41
+ (an example is provided in the Appendix below).
42
+
43
+ "Derivative Works" shall mean any work, whether in Source or Object
44
+ form, that is based on (or derived from) the Work and for which the
45
+ editorial revisions, annotations, elaborations, or other modifications
46
+ represent, as a whole, an original work of authorship. For the purposes
47
+ of this License, Derivative Works shall not include works that remain
48
+ separable from, or merely link (or bind by name) to the interfaces of,
49
+ the Work and Derivative Works thereof.
50
+
51
+ "Contribution" shall mean any work of authorship, including
52
+ the original version of the Work and any modifications or additions
53
+ to that Work or Derivative Works thereof, that is intentionally
54
+ submitted to Licensor for inclusion in the Work by the copyright owner
55
+ or by an individual or Legal Entity authorized to submit on behalf of
56
+ the copyright owner. For the purposes of this definition, "submitted"
57
+ means any form of electronic, verbal, or written communication sent
58
+ to the Licensor or its representatives, including but not limited to
59
+ communication on electronic mailing lists, source code control systems,
60
+ and issue tracking systems that are managed by, or on behalf of, the
61
+ Licensor for the purpose of discussing and improving the Work, but
62
+ excluding communication that is conspicuously marked or otherwise
63
+ designated in writing by the copyright owner as "Not a Contribution."
64
+
65
+ "Contributor" shall mean Licensor and any individual or Legal Entity
66
+ on behalf of whom a Contribution has been received by Licensor and
67
+ subsequently incorporated within the Work.
68
+
69
+ 2. Grant of Copyright License. Subject to the terms and conditions of
70
+ this License, each Contributor hereby grants to You a perpetual,
71
+ worldwide, non-exclusive, no-charge, royalty-free, irrevocable
72
+ copyright license to reproduce, prepare Derivative Works of,
73
+ publicly display, publicly perform, sublicense, and distribute the
74
+ Work and such Derivative Works in Source or Object form.
75
+
76
+ 3. Grant of Patent License. Subject to the terms and conditions of
77
+ this License, each Contributor hereby grants to You a perpetual,
78
+ worldwide, non-exclusive, no-charge, royalty-free, irrevocable
79
+ (except as stated in this section) patent license to make, have made,
80
+ use, offer to sell, sell, import, and otherwise transfer the Work,
81
+ where such license applies only to those patent claims licensable
82
+ by such Contributor that are necessarily infringed by their
83
+ Contribution(s) alone or by combination of their Contribution(s)
84
+ with the Work to which such Contribution(s) was submitted. If You
85
+ institute patent litigation against any entity (including a
86
+ cross-claim or counterclaim in a lawsuit) alleging that the Work
87
+ or a Contribution incorporated within the Work constitutes direct
88
+ or contributory patent infringement, then any patent licenses
89
+ granted to You under this License for that Work shall terminate
90
+ as of the date such litigation is filed.
91
+
92
+ 4. Redistribution. You may reproduce and distribute copies of the
93
+ Work or Derivative Works thereof in any medium, with or without
94
+ modifications, and in Source or Object form, provided that You
95
+ meet the following conditions:
96
+
97
+ (a) You must give any other recipients of the Work or
98
+ Derivative Works a copy of this License; and
99
+
100
+ (b) You must cause any modified files to carry prominent notices
101
+ stating that You changed the files; and
102
+
103
+ (c) You must retain, in the Source form of any Derivative Works
104
+ that You distribute, all copyright, patent, trademark, and
105
+ attribution notices from the Source form of the Work,
106
+ excluding those notices that do not pertain to any part of
107
+ the Derivative Works; and
108
+
109
+ (d) If the Work includes a "NOTICE" text file as part of its
110
+ distribution, then any Derivative Works that You distribute must
111
+ include a readable copy of the attribution notices contained
112
+ within such NOTICE file, excluding those notices that do not
113
+ pertain to any part of the Derivative Works, in at least one
114
+ of the following places: within a NOTICE text file distributed
115
+ as part of the Derivative Works; within the Source form or
116
+ documentation, if provided along with the Derivative Works; or,
117
+ within a display generated by the Derivative Works, if and
118
+ wherever such third-party notices normally appear. The contents
119
+ of the NOTICE file are for informational purposes only and
120
+ do not modify the License. You may add Your own attribution
121
+ notices within Derivative Works that You distribute, alongside
122
+ or as an addendum to the NOTICE text from the Work, provided
123
+ that such additional attribution notices cannot be construed
124
+ as modifying the License.
125
+
126
+ You may add Your own copyright statement to Your modifications and
127
+ may provide additional or different license terms and conditions
128
+ for use, reproduction, or distribution of Your modifications, or
129
+ for any such Derivative Works as a whole, provided Your use,
130
+ reproduction, and distribution of the Work otherwise complies with
131
+ the conditions stated in this License.
132
+
133
+ 5. Submission of Contributions. Unless You explicitly state otherwise,
134
+ any Contribution intentionally submitted for inclusion in the Work
135
+ by You to the Licensor shall be under the terms and conditions of
136
+ this License, without any additional terms or conditions.
137
+ Notwithstanding the above, nothing herein shall supersede or modify
138
+ the terms of any separate license agreement you may have executed
139
+ with Licensor regarding such Contributions.
140
+
141
+ 6. Trademarks. This License does not grant permission to use the trade
142
+ names, trademarks, service marks, or product names of the Licensor,
143
+ except as required for reasonable and customary use in describing the
144
+ origin of the Work and reproducing the content of the NOTICE file.
145
+
146
+ 7. Disclaimer of Warranty. Unless required by applicable law or
147
+ agreed to in writing, Licensor provides the Work (and each
148
+ Contributor provides its Contributions) on an "AS IS" BASIS,
149
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
150
+ implied, including, without limitation, any warranties or conditions
151
+ of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
152
+ PARTICULAR PURPOSE. You are solely responsible for determining the
153
+ appropriateness of using or redistributing the Work and assume any
154
+ risks associated with Your exercise of permissions under this License.
155
+
156
+ 8. Limitation of Liability. In no event and under no legal theory,
157
+ whether in tort (including negligence), contract, or otherwise,
158
+ unless required by applicable law (such as deliberate and grossly
159
+ negligent acts) or agreed to in writing, shall any Contributor be
160
+ liable to You for damages, including any direct, indirect, special,
161
+ incidental, or consequential damages of any character arising as a
162
+ result of this License or out of the use or inability to use the
163
+ Work (including but not limited to damages for loss of goodwill,
164
+ work stoppage, computer failure or malfunction, or any and all
165
+ other commercial damages or losses), even if such Contributor
166
+ has been advised of the possibility of such damages.
167
+
168
+ 9. Accepting Warranty or Additional Liability. While redistributing
169
+ the Work or Derivative Works thereof, You may choose to offer,
170
+ and charge a fee for, acceptance of support, warranty, indemnity,
171
+ or other liability obligations and/or rights consistent with this
172
+ License. However, in accepting such obligations, You may act only
173
+ on Your own behalf and on Your sole responsibility, not on behalf
174
+ of any other Contributor, and only if You agree to indemnify,
175
+ defend, and hold each Contributor harmless for any liability
176
+ incurred by, or claims asserted against, such Contributor by reason
177
+ of your accepting any such warranty or additional liability.
178
+
179
+ END OF TERMS AND CONDITIONS
180
+
181
+ APPENDIX: How to apply the Apache License to your work.
182
+
183
+ To apply the Apache License to your work, attach the following
184
+ boilerplate notice, with the fields enclosed by brackets "[]"
185
+ replaced with your own identifying information. (Don't include
186
+ the brackets!) The text should be enclosed in the appropriate
187
+ comment syntax for the file format. We also recommend that a
188
+ file or class name and description of purpose be included on the
189
+ same "printed page" as the copyright notice for easier
190
+ identification within third-party archives.
191
+
192
+ Copyright [yyyy] [name of copyright owner]
193
+
194
+ Licensed under the Apache License, Version 2.0 (the "License");
195
+ you may not use this file except in compliance with the License.
196
+ You may obtain a copy of the License at
197
+
198
+ http://www.apache.org/licenses/LICENSE-2.0
199
+
200
+ Unless required by applicable law or agreed to in writing, software
201
+ distributed under the License is distributed on an "AS IS" BASIS,
202
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
203
+ See the License for the specific language governing permissions and
204
+ limitations under the License.
data/NOTICE ADDED
@@ -0,0 +1,13 @@
1
+ Copyright 2012 George Armhold
2
+
3
+ Licensed under the Apache License, Version 2.0 (the "License");
4
+ you may not use this file except in compliance with the License.
5
+ You may obtain a copy of the License at
6
+
7
+ http://www.apache.org/licenses/LICENSE-2.0
8
+
9
+ Unless required by applicable law or agreed to in writing, software
10
+ distributed under the License is distributed on an "AS IS" BASIS,
11
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12
+ See the License for the specific language governing permissions and
13
+ limitations under the License.
data/README.md ADDED
@@ -0,0 +1,83 @@
1
+ # Ocarina - Optical Character Recognition (OCR) for Ruby
2
+
3
+ ### A Ruby project that uses machine learning to perform Optical Character Recognition.
4
+
5
+ ![](https://raw.github.com/armhold/ocarina/master/ocarina.png)
6
+
7
+ I created this project in order to learn Ruby. It started as kind of a toy program, but
8
+ quickly grew into something with a practical purpose (decoding [Letterpress](https://itunes.apple.com/us/app/id526619424?mt=8)
9
+ gameboards!)
10
+
11
+ It works fairly well on constrained input, but it's not really intended to be a
12
+ production-level OCR package.
13
+
14
+ ## Status
15
+
16
+ Ocarina successfully trains on and recognizes the 26 letters of the alphabet. Once trained, the network
17
+ accurately recognizes its training set (100%) and also does well (roughly 98%) at recognizing characters
18
+ with added noise.
19
+
20
+ I'm still working on how best to organize the neural network (# of hidden nodes, # of outputs,
21
+ edge weights) so that the character set can grow to cover full ASCII (and beyond).
22
+
23
+
24
+ ## Motivation
25
+
26
+ I first encountered OCR technology back in 1991 or so, on an Apple Macintosh. It seemed like
27
+ magic, even though it was a pretty poor implementation by today's standards. Recently I came across the
28
+ [Sudoku Grab](http://itunes.apple.com/app/sudoku-grab/id305614901?mt=8) app. It does OCR very successfully,
29
+ albeit on very constrained input images.
30
+
31
+ This inspired me to try to create my own (simplistic) OCR implementation, and that seemed like a
32
+ great way to learn Ruby.
33
+
34
+
35
+ ## Installation
36
+
37
+
38
+ ### Dependencies
39
+
40
+ Ocarina depends on ImageMagick (and the RMagick gem) to do its graphics processing.
41
+ On OS X at least, ImageMagick requires X11 and Ghostscript. You'll likely need to do the following:
42
+
43
+
44
+ 1. Download and install [XQuartz](http://xquartz.macosforge.org/landing)
45
+ 1. `$ brew install imagemagick`
46
+ 1. `$ brew install ghostscript`
47
+
48
+
49
+ ## Usage
50
+
51
+ #### Training
52
+
53
+ `rake ocarina:train`
54
+
55
+ #### Character Recognition
56
+
57
+ `rake ocarina:eval`
58
+
59
+ ## Contributing
60
+
61
+ 1. Fork it
62
+ 2. Create your feature branch (`git checkout -b my-new-feature`)
63
+ 3. Commit your changes (`git commit -am 'Added some feature'`)
64
+ 4. Push to the branch (`git push origin my-new-feature`)
65
+ 5. Create new Pull Request
66
+
67
+
68
+ ## LICENSE
69
+
70
+ Copyright 2012 George Armhold
71
+
72
+ Licensed under the Apache License, Version 2.0 (the "License");
73
+ you may not use this file except in compliance with the License.
74
+ You may obtain a copy of the License at
75
+
76
+ http://www.apache.org/licenses/LICENSE-2.0
77
+
78
+ Unless required by applicable law or agreed to in writing, software
79
+ distributed under the License is distributed on an "AS IS" BASIS,
80
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
81
+ See the License for the specific language governing permissions and
82
+ limitations under the License.
83
+
data/Rakefile ADDED
@@ -0,0 +1,146 @@
1
+ #!/usr/bin/env rake
2
+ require "bundler/gem_tasks"
3
+ require_relative "lib/ocarina.rb"
4
+ require 'powerbar'
5
+ require 'rake/testtask'
6
+
7
+ Rake::TestTask.new do |t|
8
+ t.libs << 'test'
9
+ end
10
+
11
+ desc "Run tests"
12
+ task :default => :test
13
+
14
+ namespace :ocarina do
15
+ include Ocarina::Util
16
+
17
+ desc "generates and persists bitmaps for reference/noise images"
18
+ task :bitmaps do |t, args|
19
+
20
+ # train/eval do not actually need bitmaps on disk; this task is provided so that
21
+ # you can examine the generated bitmap images for debugging purposes.
22
+ #
23
+ # images are saved to data/images/{reference,noise}
24
+
25
+ generator = Ocarina::CharacterGenerator.new(config)
26
+ generator.persist_tiles
27
+ end
28
+
29
+ desc "builds and trains the network"
30
+ task :train do |t, args|
31
+ network = Ocarina::Network.new(config)
32
+ generator = Ocarina::CharacterGenerator.new(network.config)
33
+
34
+ training_iterations = 350
35
+ pbar = PowerBar.new
36
+ pbar.settings.tty.finite.template.barchar = '#'
37
+ pbar.settings.tty.finite.template.padchar = '-'
38
+
39
+ training_iterations.times do |i|
40
+ generator.reference_image_hash.each_pair do |char, tile|
41
+ network.train tile, char
42
+ pbar.show(msg: "current error: #{'%.10f' % network.current_error}", done: i + 1, total: training_iterations)
43
+ end
44
+ end
45
+
46
+ puts "\nfinal training error: #{network.current_error}\n"
47
+
48
+ # run with: ruby -I"lib:test" test/network_test.rb -n test_network
49
+
50
+ file = "#{Ocarina::DATA_DIR}/train.bin"
51
+ network.save_network_to_file file
52
+
53
+ puts "trained network saved to: #{file}"
54
+ end
55
+
56
+ desc "runs the training images back through the network for evaluation"
57
+ task :eval do |t, args|
58
+ file = "#{Ocarina::DATA_DIR}/train.bin"
59
+ network = Ocarina::Network.load_network_from_file file
60
+ generator = Ocarina::CharacterGenerator.new(network.config)
61
+
62
+ puts "##### testing against reference images #####"
63
+ stats = Ocarina::ErrorStats.new(network.config)
64
+
65
+ generator.reference_image_hash.each_pair do |char, tile|
66
+ result = network.recognize tile
67
+ stats.check_error char.ord, result
68
+ end
69
+ stats.report
70
+
71
+ puts
72
+ puts "##### testing against noise images #####"
73
+
74
+ stats = Ocarina::ErrorStats.new(network.config)
75
+
76
+ generator.noise_image_hash.each_pair do |char, tile|
77
+ result = network.recognize tile
78
+ stats.check_error char.ord, result
79
+ end
80
+ stats.report
81
+ end
82
+
83
+ desc "builds and trains network using Letterpress board tiles"
84
+ task :letterpress do |t, args|
85
+ network = Ocarina::Network.new(config)
86
+ generator = Ocarina::LetterpressCharacterGenerator.new(network.config)
87
+
88
+ training_iterations = 1200
89
+ pbar = PowerBar.new
90
+ pbar.settings.tty.finite.template.barchar = '#'
91
+ pbar.settings.tty.finite.template.padchar = '-'
92
+
93
+ training_iterations.times do |i|
94
+ generator.reference_image_hash.each_pair do |char, tile|
95
+ network.train tile, char
96
+ pbar.show(msg: "current error: #{'%.10f' % network.current_error}", done: i + 1, total: training_iterations)
97
+ end
98
+ end
99
+
100
+ puts "\nfinal training error: #{network.current_error}\n"
101
+
102
+ network.save_network_to_file "#{Ocarina::DATA_DIR}/letterpress-train.bin"
103
+
104
+ puts "trained network saved to: #{Ocarina::DATA_DIR}/letterpress-train.bin"
105
+
106
+ puts "##### testing against reference images #####"
107
+ stats = Ocarina::ErrorStats.new(network.config)
108
+
109
+ generator.reference_image_hash.each_pair do |char, tile|
110
+ result = network.recognize tile
111
+ stats.check_error char.ord, result
112
+ end
113
+ stats.report
114
+
115
+ end
116
+
117
+ desc "deciphers letters from a letterpress game board"
118
+ task :gameboard, [:board_file] do |t, args|
119
+ network = Ocarina::Network.load_network_from_file "#{Ocarina::DATA_DIR}/letterpress-train.bin"
120
+
121
+ puts "reading letterpress board: #{args.board_file}..."
122
+
123
+ board = Magick::Image.read(args.board_file).first
124
+
125
+ cropper = Ocarina::LetterpressCropper.new(network.config)
126
+ chars = cropper.decipher_board(network, board)
127
+ result = ""
128
+
129
+ chars.each do |row|
130
+ row.each do |char|
131
+ result << " #{char}"
132
+ end
133
+
134
+ result << "\n"
135
+ end
136
+
137
+ puts "result: \n\n#{result}"
138
+ end
139
+
140
+ def config
141
+ # need 8 bits to represent 0..255 in binary
142
+ @config ||= Ocarina::Config.new("ABCDEFGHIJKLMNOPQRSTUVWXYZ", 8, 16, 16)
143
+ end
144
+
145
+
146
+ end