chupa-text-decomposer-libreoffice 1.0.0

Sign up to get free protection for your applications and to get access to all the features.
Files changed (48) hide show
  1. checksums.yaml +7 -0
  2. data/.yardopts +5 -0
  3. data/Gemfile +34 -0
  4. data/LICENSE.txt +502 -0
  5. data/README.md +45 -0
  6. data/Rakefile +46 -0
  7. data/chupa-text-decomposer-libreoffice.gemspec +51 -0
  8. data/doc/text/news.md +5 -0
  9. data/lib/chupa-text/decomposers/libreoffice.rb +131 -0
  10. data/test/fixture/doc/attributes.doc +0 -0
  11. data/test/fixture/doc/multi-pages.doc +0 -0
  12. data/test/fixture/doc/one-page.doc +0 -0
  13. data/test/fixture/docx/attributes.docx +0 -0
  14. data/test/fixture/docx/multi-pages.docx +0 -0
  15. data/test/fixture/docx/one-page.docx +0 -0
  16. data/test/fixture/odp/attributes.odp +0 -0
  17. data/test/fixture/odp/multi-slides.odp +0 -0
  18. data/test/fixture/odp/one-slide.odp +0 -0
  19. data/test/fixture/ods/attributes.ods +0 -0
  20. data/test/fixture/ods/multi-sheets.ods +0 -0
  21. data/test/fixture/ods/one-sheet.ods +0 -0
  22. data/test/fixture/odt/attributes.odt +0 -0
  23. data/test/fixture/odt/multi-pages.odt +0 -0
  24. data/test/fixture/odt/one-page.odt +0 -0
  25. data/test/fixture/ppt/attributes.ppt +0 -0
  26. data/test/fixture/ppt/multi-slides.ppt +0 -0
  27. data/test/fixture/ppt/one-slide.ppt +0 -0
  28. data/test/fixture/pptx/attributes.pptx +0 -0
  29. data/test/fixture/pptx/multi-slides.pptx +0 -0
  30. data/test/fixture/pptx/one-slide.pptx +0 -0
  31. data/test/fixture/xls/attributes.xls +0 -0
  32. data/test/fixture/xls/multi-sheets.xls +0 -0
  33. data/test/fixture/xls/one-sheet.xls +0 -0
  34. data/test/fixture/xlsx/attributes.xlsx +0 -0
  35. data/test/fixture/xlsx/multi-sheets.xlsx +0 -0
  36. data/test/fixture/xlsx/one-sheet.xlsx +0 -0
  37. data/test/helper.rb +45 -0
  38. data/test/run-test.rb +31 -0
  39. data/test/test-doc.rb +123 -0
  40. data/test/test-docx.rb +123 -0
  41. data/test/test-odp.rb +133 -0
  42. data/test/test-ods.rb +138 -0
  43. data/test/test-odt.rb +123 -0
  44. data/test/test-ppt.rb +133 -0
  45. data/test/test-pptx.rb +136 -0
  46. data/test/test-xls.rb +138 -0
  47. data/test/test-xlsx.rb +138 -0
  48. metadata +187 -0
metadata ADDED
@@ -0,0 +1,187 @@
1
+ --- !ruby/object:Gem::Specification
2
+ name: chupa-text-decomposer-libreoffice
3
+ version: !ruby/object:Gem::Version
4
+ version: 1.0.0
5
+ platform: ruby
6
+ authors:
7
+ - Kouhei Sutou
8
+ autorequire:
9
+ bindir: bin
10
+ cert_chain: []
11
+ date: 2014-02-16 00:00:00.000000000 Z
12
+ dependencies:
13
+ - !ruby/object:Gem::Dependency
14
+ name: chupa-text-decomposer-pdf
15
+ requirement: !ruby/object:Gem::Requirement
16
+ requirements:
17
+ - - '>='
18
+ - !ruby/object:Gem::Version
19
+ version: '0'
20
+ type: :runtime
21
+ prerelease: false
22
+ version_requirements: !ruby/object:Gem::Requirement
23
+ requirements:
24
+ - - '>='
25
+ - !ruby/object:Gem::Version
26
+ version: '0'
27
+ - !ruby/object:Gem::Dependency
28
+ name: bundler
29
+ requirement: !ruby/object:Gem::Requirement
30
+ requirements:
31
+ - - '>='
32
+ - !ruby/object:Gem::Version
33
+ version: '0'
34
+ type: :development
35
+ prerelease: false
36
+ version_requirements: !ruby/object:Gem::Requirement
37
+ requirements:
38
+ - - '>='
39
+ - !ruby/object:Gem::Version
40
+ version: '0'
41
+ - !ruby/object:Gem::Dependency
42
+ name: rake
43
+ requirement: !ruby/object:Gem::Requirement
44
+ requirements:
45
+ - - '>='
46
+ - !ruby/object:Gem::Version
47
+ version: '0'
48
+ type: :development
49
+ prerelease: false
50
+ version_requirements: !ruby/object:Gem::Requirement
51
+ requirements:
52
+ - - '>='
53
+ - !ruby/object:Gem::Version
54
+ version: '0'
55
+ - !ruby/object:Gem::Dependency
56
+ name: test-unit
57
+ requirement: !ruby/object:Gem::Requirement
58
+ requirements:
59
+ - - '>='
60
+ - !ruby/object:Gem::Version
61
+ version: '0'
62
+ type: :development
63
+ prerelease: false
64
+ version_requirements: !ruby/object:Gem::Requirement
65
+ requirements:
66
+ - - '>='
67
+ - !ruby/object:Gem::Version
68
+ version: '0'
69
+ - !ruby/object:Gem::Dependency
70
+ name: packnga
71
+ requirement: !ruby/object:Gem::Requirement
72
+ requirements:
73
+ - - '>='
74
+ - !ruby/object:Gem::Version
75
+ version: '0'
76
+ type: :development
77
+ prerelease: false
78
+ version_requirements: !ruby/object:Gem::Requirement
79
+ requirements:
80
+ - - '>='
81
+ - !ruby/object:Gem::Version
82
+ version: '0'
83
+ - !ruby/object:Gem::Dependency
84
+ name: redcarpet
85
+ requirement: !ruby/object:Gem::Requirement
86
+ requirements:
87
+ - - '>='
88
+ - !ruby/object:Gem::Version
89
+ version: '0'
90
+ type: :development
91
+ prerelease: false
92
+ version_requirements: !ruby/object:Gem::Requirement
93
+ requirements:
94
+ - - '>='
95
+ - !ruby/object:Gem::Version
96
+ version: '0'
97
+ description: |
98
+ This is a ChupaText decomposer plugin to extract text and
99
+ meta-data from office files such as Microsoft Word file, Microsoft
100
+ Excel file and OpenDocument Format file. It uses
101
+ [LibreOffice](https://www.libreoffice.org/).
102
+
103
+ You can use `libreoffice` decomposer.
104
+
105
+ It depends on the `pdf` decomposer because it converts an office file to
106
+ a PDF file and extracts text and meta-data with the `pdf` decomposer.
107
+ email:
108
+ - kou@clear-code.com
109
+ executables: []
110
+ extensions: []
111
+ extra_rdoc_files: []
112
+ files:
113
+ - chupa-text-decomposer-libreoffice.gemspec
114
+ - README.md
115
+ - LICENSE.txt
116
+ - Rakefile
117
+ - Gemfile
118
+ - .yardopts
119
+ - lib/chupa-text/decomposers/libreoffice.rb
120
+ - doc/text/news.md
121
+ - test/test-docx.rb
122
+ - test/test-doc.rb
123
+ - test/helper.rb
124
+ - test/test-ods.rb
125
+ - test/fixture/odp/attributes.odp
126
+ - test/fixture/odp/multi-slides.odp
127
+ - test/fixture/odp/one-slide.odp
128
+ - test/fixture/odt/one-page.odt
129
+ - test/fixture/odt/multi-pages.odt
130
+ - test/fixture/odt/attributes.odt
131
+ - test/fixture/docx/one-page.docx
132
+ - test/fixture/docx/multi-pages.docx
133
+ - test/fixture/docx/attributes.docx
134
+ - test/fixture/ods/one-sheet.ods
135
+ - test/fixture/ods/attributes.ods
136
+ - test/fixture/ods/multi-sheets.ods
137
+ - test/fixture/doc/attributes.doc
138
+ - test/fixture/doc/one-page.doc
139
+ - test/fixture/doc/multi-pages.doc
140
+ - test/fixture/xls/attributes.xls
141
+ - test/fixture/xls/multi-sheets.xls
142
+ - test/fixture/xls/one-sheet.xls
143
+ - test/fixture/pptx/one-slide.pptx
144
+ - test/fixture/pptx/multi-slides.pptx
145
+ - test/fixture/pptx/attributes.pptx
146
+ - test/fixture/xlsx/attributes.xlsx
147
+ - test/fixture/xlsx/one-sheet.xlsx
148
+ - test/fixture/xlsx/multi-sheets.xlsx
149
+ - test/fixture/ppt/attributes.ppt
150
+ - test/fixture/ppt/multi-slides.ppt
151
+ - test/fixture/ppt/one-slide.ppt
152
+ - test/test-odp.rb
153
+ - test/test-xls.rb
154
+ - test/run-test.rb
155
+ - test/test-xlsx.rb
156
+ - test/test-ppt.rb
157
+ - test/test-pptx.rb
158
+ - test/test-odt.rb
159
+ homepage: https://github.com/ranguba/chupa-text-decomposer-libreoffice
160
+ licenses:
161
+ - LGPLv2.1 or later
162
+ metadata: {}
163
+ post_install_message:
164
+ rdoc_options: []
165
+ require_paths:
166
+ - lib
167
+ required_ruby_version: !ruby/object:Gem::Requirement
168
+ requirements:
169
+ - - '>='
170
+ - !ruby/object:Gem::Version
171
+ version: '0'
172
+ required_rubygems_version: !ruby/object:Gem::Requirement
173
+ requirements:
174
+ - - '>='
175
+ - !ruby/object:Gem::Version
176
+ version: '0'
177
+ requirements:
178
+ - LibreOffice
179
+ rubyforge_project:
180
+ rubygems_version: 2.0.14
181
+ signing_key:
182
+ specification_version: 4
183
+ summary: This is a ChupaText decomposer plugin to extract text and meta-data from
184
+ office files such as Microsoft Word file, Microsoft Excel file and OpenDocument
185
+ Format file. It uses [LibreOffice](https://www.libreoffice.org/).
186
+ test_files: []
187
+ has_rdoc: