chupa-text-decomposer-libreoffice 1.0.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (48) hide show
  1. checksums.yaml +7 -0
  2. data/.yardopts +5 -0
  3. data/Gemfile +34 -0
  4. data/LICENSE.txt +502 -0
  5. data/README.md +45 -0
  6. data/Rakefile +46 -0
  7. data/chupa-text-decomposer-libreoffice.gemspec +51 -0
  8. data/doc/text/news.md +5 -0
  9. data/lib/chupa-text/decomposers/libreoffice.rb +131 -0
  10. data/test/fixture/doc/attributes.doc +0 -0
  11. data/test/fixture/doc/multi-pages.doc +0 -0
  12. data/test/fixture/doc/one-page.doc +0 -0
  13. data/test/fixture/docx/attributes.docx +0 -0
  14. data/test/fixture/docx/multi-pages.docx +0 -0
  15. data/test/fixture/docx/one-page.docx +0 -0
  16. data/test/fixture/odp/attributes.odp +0 -0
  17. data/test/fixture/odp/multi-slides.odp +0 -0
  18. data/test/fixture/odp/one-slide.odp +0 -0
  19. data/test/fixture/ods/attributes.ods +0 -0
  20. data/test/fixture/ods/multi-sheets.ods +0 -0
  21. data/test/fixture/ods/one-sheet.ods +0 -0
  22. data/test/fixture/odt/attributes.odt +0 -0
  23. data/test/fixture/odt/multi-pages.odt +0 -0
  24. data/test/fixture/odt/one-page.odt +0 -0
  25. data/test/fixture/ppt/attributes.ppt +0 -0
  26. data/test/fixture/ppt/multi-slides.ppt +0 -0
  27. data/test/fixture/ppt/one-slide.ppt +0 -0
  28. data/test/fixture/pptx/attributes.pptx +0 -0
  29. data/test/fixture/pptx/multi-slides.pptx +0 -0
  30. data/test/fixture/pptx/one-slide.pptx +0 -0
  31. data/test/fixture/xls/attributes.xls +0 -0
  32. data/test/fixture/xls/multi-sheets.xls +0 -0
  33. data/test/fixture/xls/one-sheet.xls +0 -0
  34. data/test/fixture/xlsx/attributes.xlsx +0 -0
  35. data/test/fixture/xlsx/multi-sheets.xlsx +0 -0
  36. data/test/fixture/xlsx/one-sheet.xlsx +0 -0
  37. data/test/helper.rb +45 -0
  38. data/test/run-test.rb +31 -0
  39. data/test/test-doc.rb +123 -0
  40. data/test/test-docx.rb +123 -0
  41. data/test/test-odp.rb +133 -0
  42. data/test/test-ods.rb +138 -0
  43. data/test/test-odt.rb +123 -0
  44. data/test/test-ppt.rb +133 -0
  45. data/test/test-pptx.rb +136 -0
  46. data/test/test-xls.rb +138 -0
  47. data/test/test-xlsx.rb +138 -0
  48. metadata +187 -0
metadata ADDED
@@ -0,0 +1,187 @@
1
+ --- !ruby/object:Gem::Specification
2
+ name: chupa-text-decomposer-libreoffice
3
+ version: !ruby/object:Gem::Version
4
+ version: 1.0.0
5
+ platform: ruby
6
+ authors:
7
+ - Kouhei Sutou
8
+ autorequire:
9
+ bindir: bin
10
+ cert_chain: []
11
+ date: 2014-02-16 00:00:00.000000000 Z
12
+ dependencies:
13
+ - !ruby/object:Gem::Dependency
14
+ name: chupa-text-decomposer-pdf
15
+ requirement: !ruby/object:Gem::Requirement
16
+ requirements:
17
+ - - '>='
18
+ - !ruby/object:Gem::Version
19
+ version: '0'
20
+ type: :runtime
21
+ prerelease: false
22
+ version_requirements: !ruby/object:Gem::Requirement
23
+ requirements:
24
+ - - '>='
25
+ - !ruby/object:Gem::Version
26
+ version: '0'
27
+ - !ruby/object:Gem::Dependency
28
+ name: bundler
29
+ requirement: !ruby/object:Gem::Requirement
30
+ requirements:
31
+ - - '>='
32
+ - !ruby/object:Gem::Version
33
+ version: '0'
34
+ type: :development
35
+ prerelease: false
36
+ version_requirements: !ruby/object:Gem::Requirement
37
+ requirements:
38
+ - - '>='
39
+ - !ruby/object:Gem::Version
40
+ version: '0'
41
+ - !ruby/object:Gem::Dependency
42
+ name: rake
43
+ requirement: !ruby/object:Gem::Requirement
44
+ requirements:
45
+ - - '>='
46
+ - !ruby/object:Gem::Version
47
+ version: '0'
48
+ type: :development
49
+ prerelease: false
50
+ version_requirements: !ruby/object:Gem::Requirement
51
+ requirements:
52
+ - - '>='
53
+ - !ruby/object:Gem::Version
54
+ version: '0'
55
+ - !ruby/object:Gem::Dependency
56
+ name: test-unit
57
+ requirement: !ruby/object:Gem::Requirement
58
+ requirements:
59
+ - - '>='
60
+ - !ruby/object:Gem::Version
61
+ version: '0'
62
+ type: :development
63
+ prerelease: false
64
+ version_requirements: !ruby/object:Gem::Requirement
65
+ requirements:
66
+ - - '>='
67
+ - !ruby/object:Gem::Version
68
+ version: '0'
69
+ - !ruby/object:Gem::Dependency
70
+ name: packnga
71
+ requirement: !ruby/object:Gem::Requirement
72
+ requirements:
73
+ - - '>='
74
+ - !ruby/object:Gem::Version
75
+ version: '0'
76
+ type: :development
77
+ prerelease: false
78
+ version_requirements: !ruby/object:Gem::Requirement
79
+ requirements:
80
+ - - '>='
81
+ - !ruby/object:Gem::Version
82
+ version: '0'
83
+ - !ruby/object:Gem::Dependency
84
+ name: redcarpet
85
+ requirement: !ruby/object:Gem::Requirement
86
+ requirements:
87
+ - - '>='
88
+ - !ruby/object:Gem::Version
89
+ version: '0'
90
+ type: :development
91
+ prerelease: false
92
+ version_requirements: !ruby/object:Gem::Requirement
93
+ requirements:
94
+ - - '>='
95
+ - !ruby/object:Gem::Version
96
+ version: '0'
97
+ description: |
98
+ This is a ChupaText decomposer plugin to extract text and
99
+ meta-data from office files such as Microsoft Word file, Microsoft
100
+ Excel file and OpenDocument Format file. It uses
101
+ [LibreOffice](https://www.libreoffice.org/).
102
+
103
+ You can use `libreoffice` decomposer.
104
+
105
+ It depends on the `pdf` decomposer because it converts an office file to
106
+ PDF file and extracts text and meta-data by `pdf` decomposer.
107
+ email:
108
+ - kou@clear-code.com
109
+ executables: []
110
+ extensions: []
111
+ extra_rdoc_files: []
112
+ files:
113
+ - chupa-text-decomposer-libreoffice.gemspec
114
+ - README.md
115
+ - LICENSE.txt
116
+ - Rakefile
117
+ - Gemfile
118
+ - .yardopts
119
+ - lib/chupa-text/decomposers/libreoffice.rb
120
+ - doc/text/news.md
121
+ - test/test-docx.rb
122
+ - test/test-doc.rb
123
+ - test/helper.rb
124
+ - test/test-ods.rb
125
+ - test/fixture/odp/attributes.odp
126
+ - test/fixture/odp/multi-slides.odp
127
+ - test/fixture/odp/one-slide.odp
128
+ - test/fixture/odt/one-page.odt
129
+ - test/fixture/odt/multi-pages.odt
130
+ - test/fixture/odt/attributes.odt
131
+ - test/fixture/docx/one-page.docx
132
+ - test/fixture/docx/multi-pages.docx
133
+ - test/fixture/docx/attributes.docx
134
+ - test/fixture/ods/one-sheet.ods
135
+ - test/fixture/ods/attributes.ods
136
+ - test/fixture/ods/multi-sheets.ods
137
+ - test/fixture/doc/attributes.doc
138
+ - test/fixture/doc/one-page.doc
139
+ - test/fixture/doc/multi-pages.doc
140
+ - test/fixture/xls/attributes.xls
141
+ - test/fixture/xls/multi-sheets.xls
142
+ - test/fixture/xls/one-sheet.xls
143
+ - test/fixture/pptx/one-slide.pptx
144
+ - test/fixture/pptx/multi-slides.pptx
145
+ - test/fixture/pptx/attributes.pptx
146
+ - test/fixture/xlsx/attributes.xlsx
147
+ - test/fixture/xlsx/one-sheet.xlsx
148
+ - test/fixture/xlsx/multi-sheets.xlsx
149
+ - test/fixture/ppt/attributes.ppt
150
+ - test/fixture/ppt/multi-slides.ppt
151
+ - test/fixture/ppt/one-slide.ppt
152
+ - test/test-odp.rb
153
+ - test/test-xls.rb
154
+ - test/run-test.rb
155
+ - test/test-xlsx.rb
156
+ - test/test-ppt.rb
157
+ - test/test-pptx.rb
158
+ - test/test-odt.rb
159
+ homepage: https://github.com/ranguba/chupa-text-decomposer-libreoffice
160
+ licenses:
161
+ - LGPLv2.1 or later
162
+ metadata: {}
163
+ post_install_message:
164
+ rdoc_options: []
165
+ require_paths:
166
+ - lib
167
+ required_ruby_version: !ruby/object:Gem::Requirement
168
+ requirements:
169
+ - - '>='
170
+ - !ruby/object:Gem::Version
171
+ version: '0'
172
+ required_rubygems_version: !ruby/object:Gem::Requirement
173
+ requirements:
174
+ - - '>='
175
+ - !ruby/object:Gem::Version
176
+ version: '0'
177
+ requirements:
178
+ - LibreOffice
179
+ rubyforge_project:
180
+ rubygems_version: 2.0.14
181
+ signing_key:
182
+ specification_version: 4
183
+ summary: This is a ChupaText decomposer plugin to extract text and meta-data from
184
+ office files such as Microsoft Word file, Microsoft Excel file and OpenDocument
185
+ Format file. It uses [LibreOffice](https://www.libreoffice.org/).
186
+ test_files: []
187
+ has_rdoc: