chupa-text 1.0.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (67) hide show
  1. checksums.yaml +7 -0
  2. data/.yardopts +5 -0
  3. data/Gemfile +21 -0
  4. data/LICENSE.txt +502 -0
  5. data/README.md +91 -0
  6. data/Rakefile +46 -0
  7. data/bin/chupa-text +21 -0
  8. data/bin/chupa-text-generate-decomposer +21 -0
  9. data/chupa-text.gemspec +58 -0
  10. data/data/chupa-text.conf +5 -0
  11. data/data/mime-types.conf +19 -0
  12. data/doc/text/command-line.md +136 -0
  13. data/doc/text/decomposer.md +343 -0
  14. data/doc/text/library.md +72 -0
  15. data/doc/text/news.md +5 -0
  16. data/lib/chupa-text.rb +37 -0
  17. data/lib/chupa-text/command.rb +18 -0
  18. data/lib/chupa-text/command/chupa-text-generate-decomposer.rb +324 -0
  19. data/lib/chupa-text/command/chupa-text.rb +102 -0
  20. data/lib/chupa-text/configuration-loader.rb +95 -0
  21. data/lib/chupa-text/configuration.rb +49 -0
  22. data/lib/chupa-text/data.rb +149 -0
  23. data/lib/chupa-text/decomposer-registry.rb +37 -0
  24. data/lib/chupa-text/decomposer.rb +37 -0
  25. data/lib/chupa-text/decomposers.rb +59 -0
  26. data/lib/chupa-text/decomposers/csv.rb +44 -0
  27. data/lib/chupa-text/decomposers/gzip.rb +51 -0
  28. data/lib/chupa-text/decomposers/tar.rb +42 -0
  29. data/lib/chupa-text/decomposers/xml.rb +55 -0
  30. data/lib/chupa-text/extractor.rb +91 -0
  31. data/lib/chupa-text/file-content.rb +35 -0
  32. data/lib/chupa-text/formatters.rb +17 -0
  33. data/lib/chupa-text/formatters/json.rb +60 -0
  34. data/lib/chupa-text/input-data.rb +58 -0
  35. data/lib/chupa-text/mime-type-registry.rb +41 -0
  36. data/lib/chupa-text/mime-type.rb +36 -0
  37. data/lib/chupa-text/text-data.rb +26 -0
  38. data/lib/chupa-text/version.rb +19 -0
  39. data/lib/chupa-text/virtual-content.rb +91 -0
  40. data/lib/chupa-text/virtual-file-data.rb +46 -0
  41. data/test/command/test-chupa-text.rb +178 -0
  42. data/test/decomposers/test-csv.rb +48 -0
  43. data/test/decomposers/test-gzip.rb +113 -0
  44. data/test/decomposers/test-tar.rb +78 -0
  45. data/test/decomposers/test-xml.rb +58 -0
  46. data/test/fixture/command/chupa-text/hello.txt +1 -0
  47. data/test/fixture/command/chupa-text/hello.txt.gz +0 -0
  48. data/test/fixture/command/chupa-text/no-decomposer.conf +3 -0
  49. data/test/fixture/extractor/hello.txt +1 -0
  50. data/test/fixture/gzip/hello.tar.gz +0 -0
  51. data/test/fixture/gzip/hello.tgz +0 -0
  52. data/test/fixture/gzip/hello.txt.gz +0 -0
  53. data/test/fixture/tar/directory.tar +0 -0
  54. data/test/fixture/tar/top-level.tar +0 -0
  55. data/test/helper.rb +25 -0
  56. data/test/run-test.rb +35 -0
  57. data/test/test-configuration-loader.rb +54 -0
  58. data/test/test-data.rb +85 -0
  59. data/test/test-decomposer-registry.rb +30 -0
  60. data/test/test-decomposer.rb +41 -0
  61. data/test/test-decomposers.rb +59 -0
  62. data/test/test-extractor.rb +125 -0
  63. data/test/test-file-content.rb +51 -0
  64. data/test/test-mime-type-registry.rb +48 -0
  65. data/test/test-text-data.rb +36 -0
  66. data/test/test-virtual-content.rb +103 -0
  67. metadata +183 -0
metadata ADDED
@@ -0,0 +1,183 @@
1
+ --- !ruby/object:Gem::Specification
2
+ name: chupa-text
3
+ version: !ruby/object:Gem::Version
4
+ version: 1.0.0
5
+ platform: ruby
6
+ authors:
7
+ - Kouhei Sutou
8
+ autorequire:
9
+ bindir: bin
10
+ cert_chain: []
11
+ date: 2014-01-04 00:00:00.000000000 Z
12
+ dependencies:
13
+ - !ruby/object:Gem::Dependency
14
+ name: bundler
15
+ requirement: !ruby/object:Gem::Requirement
16
+ requirements:
17
+ - - '>='
18
+ - !ruby/object:Gem::Version
19
+ version: '0'
20
+ type: :development
21
+ prerelease: false
22
+ version_requirements: !ruby/object:Gem::Requirement
23
+ requirements:
24
+ - - '>='
25
+ - !ruby/object:Gem::Version
26
+ version: '0'
27
+ - !ruby/object:Gem::Dependency
28
+ name: rake
29
+ requirement: !ruby/object:Gem::Requirement
30
+ requirements:
31
+ - - '>='
32
+ - !ruby/object:Gem::Version
33
+ version: '0'
34
+ type: :development
35
+ prerelease: false
36
+ version_requirements: !ruby/object:Gem::Requirement
37
+ requirements:
38
+ - - '>='
39
+ - !ruby/object:Gem::Version
40
+ version: '0'
41
+ - !ruby/object:Gem::Dependency
42
+ name: test-unit
43
+ requirement: !ruby/object:Gem::Requirement
44
+ requirements:
45
+ - - '>='
46
+ - !ruby/object:Gem::Version
47
+ version: '0'
48
+ type: :development
49
+ prerelease: false
50
+ version_requirements: !ruby/object:Gem::Requirement
51
+ requirements:
52
+ - - '>='
53
+ - !ruby/object:Gem::Version
54
+ version: '0'
55
+ - !ruby/object:Gem::Dependency
56
+ name: packnga
57
+ requirement: !ruby/object:Gem::Requirement
58
+ requirements:
59
+ - - '>='
60
+ - !ruby/object:Gem::Version
61
+ version: '0'
62
+ type: :development
63
+ prerelease: false
64
+ version_requirements: !ruby/object:Gem::Requirement
65
+ requirements:
66
+ - - '>='
67
+ - !ruby/object:Gem::Version
68
+ version: '0'
69
+ - !ruby/object:Gem::Dependency
70
+ name: redcarpet
71
+ requirement: !ruby/object:Gem::Requirement
72
+ requirements:
73
+ - - '>='
74
+ - !ruby/object:Gem::Version
75
+ version: '0'
76
+ type: :development
77
+ prerelease: false
78
+ version_requirements: !ruby/object:Gem::Requirement
79
+ requirements:
80
+ - - '>='
81
+ - !ruby/object:Gem::Version
82
+ version: '0'
83
+ description: ''
84
+ email:
85
+ - kou@clear-code.com
86
+ executables:
87
+ - chupa-text
88
+ - chupa-text-generate-decomposer
89
+ extensions: []
90
+ extra_rdoc_files: []
91
+ files:
92
+ - chupa-text.gemspec
93
+ - README.md
94
+ - LICENSE.txt
95
+ - Rakefile
96
+ - Gemfile
97
+ - .yardopts
98
+ - data/chupa-text.conf
99
+ - data/mime-types.conf
100
+ - lib/chupa-text/data.rb
101
+ - lib/chupa-text/version.rb
102
+ - lib/chupa-text/extractor.rb
103
+ - lib/chupa-text/command/chupa-text.rb
104
+ - lib/chupa-text/command/chupa-text-generate-decomposer.rb
105
+ - lib/chupa-text/configuration.rb
106
+ - lib/chupa-text/decomposer-registry.rb
107
+ - lib/chupa-text/text-data.rb
108
+ - lib/chupa-text/configuration-loader.rb
109
+ - lib/chupa-text/virtual-file-data.rb
110
+ - lib/chupa-text/formatters/json.rb
111
+ - lib/chupa-text/virtual-content.rb
112
+ - lib/chupa-text/decomposers/csv.rb
113
+ - lib/chupa-text/decomposers/tar.rb
114
+ - lib/chupa-text/decomposers/xml.rb
115
+ - lib/chupa-text/decomposers/gzip.rb
116
+ - lib/chupa-text/formatters.rb
117
+ - lib/chupa-text/decomposers.rb
118
+ - lib/chupa-text/command.rb
119
+ - lib/chupa-text/file-content.rb
120
+ - lib/chupa-text/decomposer.rb
121
+ - lib/chupa-text/mime-type.rb
122
+ - lib/chupa-text/input-data.rb
123
+ - lib/chupa-text/mime-type-registry.rb
124
+ - lib/chupa-text.rb
125
+ - doc/text/decomposer.md
126
+ - doc/text/command-line.md
127
+ - doc/text/news.md
128
+ - doc/text/library.md
129
+ - test/test-decomposers.rb
130
+ - test/test-decomposer.rb
131
+ - test/test-virtual-content.rb
132
+ - test/command/test-chupa-text.rb
133
+ - test/helper.rb
134
+ - test/test-configuration-loader.rb
135
+ - test/test-mime-type-registry.rb
136
+ - test/test-decomposer-registry.rb
137
+ - test/fixture/gzip/hello.txt.gz
138
+ - test/fixture/gzip/hello.tgz
139
+ - test/fixture/gzip/hello.tar.gz
140
+ - test/fixture/tar/top-level.tar
141
+ - test/fixture/tar/directory.tar
142
+ - test/fixture/command/chupa-text/hello.txt.gz
143
+ - test/fixture/command/chupa-text/no-decomposer.conf
144
+ - test/fixture/command/chupa-text/hello.txt
145
+ - test/fixture/extractor/hello.txt
146
+ - test/decomposers/test-csv.rb
147
+ - test/decomposers/test-gzip.rb
148
+ - test/decomposers/test-tar.rb
149
+ - test/decomposers/test-xml.rb
150
+ - test/test-data.rb
151
+ - test/test-file-content.rb
152
+ - test/test-extractor.rb
153
+ - test/run-test.rb
154
+ - test/test-text-data.rb
155
+ - bin/chupa-text
156
+ - bin/chupa-text-generate-decomposer
157
+ homepage: http://ranguba.org/#about-chupa-text
158
+ licenses:
159
+ - LGPLv2.1 or later
160
+ metadata: {}
161
+ post_install_message:
162
+ rdoc_options: []
163
+ require_paths:
164
+ - lib
165
+ required_ruby_version: !ruby/object:Gem::Requirement
166
+ requirements:
167
+ - - '>='
168
+ - !ruby/object:Gem::Version
169
+ version: '0'
170
+ required_rubygems_version: !ruby/object:Gem::Requirement
171
+ requirements:
172
+ - - '>='
173
+ - !ruby/object:Gem::Version
174
+ version: '0'
175
+ requirements: []
176
+ rubyforge_project:
177
+ rubygems_version: 2.0.14
178
+ signing_key:
179
+ specification_version: 4
180
+ summary: ChupaText is an extensible text extractor. You can plug your custom text
181
+ extractor in ChupaText. You can write your plugin by Ruby.
182
+ test_files: []
183
+ has_rdoc: