hexapdf 0.1.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (346) hide show
  1. checksums.yaml +7 -0
  2. data/CONTRIBUTERS +3 -0
  3. data/LICENSE +26 -0
  4. data/README.md +88 -0
  5. data/Rakefile +121 -0
  6. data/VERSION +1 -0
  7. data/agpl-3.0.txt +661 -0
  8. data/bin/hexapdf +6 -0
  9. data/data/hexapdf/afm/Courier-Bold.afm +342 -0
  10. data/data/hexapdf/afm/Courier-BoldOblique.afm +342 -0
  11. data/data/hexapdf/afm/Courier-Oblique.afm +342 -0
  12. data/data/hexapdf/afm/Courier.afm +342 -0
  13. data/data/hexapdf/afm/Helvetica-Bold.afm +2827 -0
  14. data/data/hexapdf/afm/Helvetica-BoldOblique.afm +2827 -0
  15. data/data/hexapdf/afm/Helvetica-Oblique.afm +3051 -0
  16. data/data/hexapdf/afm/Helvetica.afm +3051 -0
  17. data/data/hexapdf/afm/MustRead.html +1 -0
  18. data/data/hexapdf/afm/Symbol.afm +213 -0
  19. data/data/hexapdf/afm/Times-Bold.afm +2588 -0
  20. data/data/hexapdf/afm/Times-BoldItalic.afm +2384 -0
  21. data/data/hexapdf/afm/Times-Italic.afm +2667 -0
  22. data/data/hexapdf/afm/Times-Roman.afm +2419 -0
  23. data/data/hexapdf/afm/ZapfDingbats.afm +225 -0
  24. data/data/hexapdf/encoding/glyphlist.txt +4305 -0
  25. data/data/hexapdf/encoding/zapfdingbats.txt +225 -0
  26. data/examples/arc.rb +50 -0
  27. data/examples/graphics.rb +274 -0
  28. data/examples/hello_world.rb +16 -0
  29. data/examples/machupicchu.jpg +0 -0
  30. data/examples/merging.rb +24 -0
  31. data/examples/optimizing.rb +20 -0
  32. data/examples/show_char_bboxes.rb +55 -0
  33. data/examples/standard_pdf_fonts.rb +72 -0
  34. data/examples/truetype.rb +45 -0
  35. data/lib/hexapdf/cli/extract.rb +128 -0
  36. data/lib/hexapdf/cli/info.rb +121 -0
  37. data/lib/hexapdf/cli/inspect.rb +157 -0
  38. data/lib/hexapdf/cli/modify.rb +218 -0
  39. data/lib/hexapdf/cli.rb +121 -0
  40. data/lib/hexapdf/configuration.rb +392 -0
  41. data/lib/hexapdf/content/canvas.rb +1974 -0
  42. data/lib/hexapdf/content/color_space.rb +364 -0
  43. data/lib/hexapdf/content/graphic_object/arc.rb +267 -0
  44. data/lib/hexapdf/content/graphic_object/endpoint_arc.rb +208 -0
  45. data/lib/hexapdf/content/graphic_object/solid_arc.rb +173 -0
  46. data/lib/hexapdf/content/graphic_object.rb +81 -0
  47. data/lib/hexapdf/content/graphics_state.rb +579 -0
  48. data/lib/hexapdf/content/operator.rb +1072 -0
  49. data/lib/hexapdf/content/parser.rb +204 -0
  50. data/lib/hexapdf/content/processor.rb +451 -0
  51. data/lib/hexapdf/content/transformation_matrix.rb +172 -0
  52. data/lib/hexapdf/content.rb +47 -0
  53. data/lib/hexapdf/data_dir.rb +51 -0
  54. data/lib/hexapdf/dictionary.rb +303 -0
  55. data/lib/hexapdf/dictionary_fields.rb +382 -0
  56. data/lib/hexapdf/document.rb +589 -0
  57. data/lib/hexapdf/document_utils.rb +209 -0
  58. data/lib/hexapdf/encryption/aes.rb +206 -0
  59. data/lib/hexapdf/encryption/arc4.rb +93 -0
  60. data/lib/hexapdf/encryption/fast_aes.rb +79 -0
  61. data/lib/hexapdf/encryption/fast_arc4.rb +67 -0
  62. data/lib/hexapdf/encryption/identity.rb +63 -0
  63. data/lib/hexapdf/encryption/ruby_aes.rb +447 -0
  64. data/lib/hexapdf/encryption/ruby_arc4.rb +96 -0
  65. data/lib/hexapdf/encryption/security_handler.rb +494 -0
  66. data/lib/hexapdf/encryption/standard_security_handler.rb +616 -0
  67. data/lib/hexapdf/encryption.rb +94 -0
  68. data/lib/hexapdf/error.rb +73 -0
  69. data/lib/hexapdf/filter/ascii85_decode.rb +160 -0
  70. data/lib/hexapdf/filter/ascii_hex_decode.rb +87 -0
  71. data/lib/hexapdf/filter/dct_decode.rb +57 -0
  72. data/lib/hexapdf/filter/encryption.rb +59 -0
  73. data/lib/hexapdf/filter/flate_decode.rb +93 -0
  74. data/lib/hexapdf/filter/jpx_decode.rb +56 -0
  75. data/lib/hexapdf/filter/lzw_decode.rb +191 -0
  76. data/lib/hexapdf/filter/predictor.rb +266 -0
  77. data/lib/hexapdf/filter/run_length_decode.rb +108 -0
  78. data/lib/hexapdf/filter.rb +176 -0
  79. data/lib/hexapdf/font/cmap/parser.rb +146 -0
  80. data/lib/hexapdf/font/cmap/writer.rb +176 -0
  81. data/lib/hexapdf/font/cmap.rb +90 -0
  82. data/lib/hexapdf/font/encoding/base.rb +77 -0
  83. data/lib/hexapdf/font/encoding/difference_encoding.rb +64 -0
  84. data/lib/hexapdf/font/encoding/glyph_list.rb +150 -0
  85. data/lib/hexapdf/font/encoding/mac_expert_encoding.rb +221 -0
  86. data/lib/hexapdf/font/encoding/mac_roman_encoding.rb +265 -0
  87. data/lib/hexapdf/font/encoding/standard_encoding.rb +205 -0
  88. data/lib/hexapdf/font/encoding/symbol_encoding.rb +244 -0
  89. data/lib/hexapdf/font/encoding/win_ansi_encoding.rb +280 -0
  90. data/lib/hexapdf/font/encoding/zapf_dingbats_encoding.rb +250 -0
  91. data/lib/hexapdf/font/encoding.rb +68 -0
  92. data/lib/hexapdf/font/true_type/font.rb +179 -0
  93. data/lib/hexapdf/font/true_type/table/cmap.rb +103 -0
  94. data/lib/hexapdf/font/true_type/table/cmap_subtable.rb +384 -0
  95. data/lib/hexapdf/font/true_type/table/directory.rb +92 -0
  96. data/lib/hexapdf/font/true_type/table/glyf.rb +166 -0
  97. data/lib/hexapdf/font/true_type/table/head.rb +143 -0
  98. data/lib/hexapdf/font/true_type/table/hhea.rb +109 -0
  99. data/lib/hexapdf/font/true_type/table/hmtx.rb +79 -0
  100. data/lib/hexapdf/font/true_type/table/loca.rb +79 -0
  101. data/lib/hexapdf/font/true_type/table/maxp.rb +112 -0
  102. data/lib/hexapdf/font/true_type/table/name.rb +218 -0
  103. data/lib/hexapdf/font/true_type/table/os2.rb +200 -0
  104. data/lib/hexapdf/font/true_type/table/post.rb +230 -0
  105. data/lib/hexapdf/font/true_type/table.rb +155 -0
  106. data/lib/hexapdf/font/true_type.rb +48 -0
  107. data/lib/hexapdf/font/true_type_wrapper.rb +240 -0
  108. data/lib/hexapdf/font/type1/afm_parser.rb +230 -0
  109. data/lib/hexapdf/font/type1/character_metrics.rb +67 -0
  110. data/lib/hexapdf/font/type1/font.rb +123 -0
  111. data/lib/hexapdf/font/type1/font_metrics.rb +117 -0
  112. data/lib/hexapdf/font/type1/pfb_parser.rb +71 -0
  113. data/lib/hexapdf/font/type1.rb +52 -0
  114. data/lib/hexapdf/font/type1_wrapper.rb +193 -0
  115. data/lib/hexapdf/font_loader/from_configuration.rb +70 -0
  116. data/lib/hexapdf/font_loader/standard14.rb +98 -0
  117. data/lib/hexapdf/font_loader.rb +85 -0
  118. data/lib/hexapdf/font_utils.rb +89 -0
  119. data/lib/hexapdf/image_loader/jpeg.rb +166 -0
  120. data/lib/hexapdf/image_loader/pdf.rb +89 -0
  121. data/lib/hexapdf/image_loader/png.rb +410 -0
  122. data/lib/hexapdf/image_loader.rb +68 -0
  123. data/lib/hexapdf/importer.rb +139 -0
  124. data/lib/hexapdf/name_tree_node.rb +78 -0
  125. data/lib/hexapdf/number_tree_node.rb +67 -0
  126. data/lib/hexapdf/object.rb +363 -0
  127. data/lib/hexapdf/parser.rb +349 -0
  128. data/lib/hexapdf/rectangle.rb +99 -0
  129. data/lib/hexapdf/reference.rb +98 -0
  130. data/lib/hexapdf/revision.rb +206 -0
  131. data/lib/hexapdf/revisions.rb +194 -0
  132. data/lib/hexapdf/serializer.rb +326 -0
  133. data/lib/hexapdf/stream.rb +279 -0
  134. data/lib/hexapdf/task/dereference.rb +109 -0
  135. data/lib/hexapdf/task/optimize.rb +230 -0
  136. data/lib/hexapdf/task.rb +68 -0
  137. data/lib/hexapdf/tokenizer.rb +406 -0
  138. data/lib/hexapdf/type/catalog.rb +107 -0
  139. data/lib/hexapdf/type/embedded_file.rb +87 -0
  140. data/lib/hexapdf/type/file_specification.rb +232 -0
  141. data/lib/hexapdf/type/font.rb +81 -0
  142. data/lib/hexapdf/type/font_descriptor.rb +109 -0
  143. data/lib/hexapdf/type/font_simple.rb +190 -0
  144. data/lib/hexapdf/type/font_true_type.rb +47 -0
  145. data/lib/hexapdf/type/font_type1.rb +162 -0
  146. data/lib/hexapdf/type/form.rb +103 -0
  147. data/lib/hexapdf/type/graphics_state_parameter.rb +79 -0
  148. data/lib/hexapdf/type/image.rb +73 -0
  149. data/lib/hexapdf/type/info.rb +70 -0
  150. data/lib/hexapdf/type/names.rb +69 -0
  151. data/lib/hexapdf/type/object_stream.rb +224 -0
  152. data/lib/hexapdf/type/page.rb +355 -0
  153. data/lib/hexapdf/type/page_tree_node.rb +269 -0
  154. data/lib/hexapdf/type/resources.rb +212 -0
  155. data/lib/hexapdf/type/trailer.rb +128 -0
  156. data/lib/hexapdf/type/viewer_preferences.rb +73 -0
  157. data/lib/hexapdf/type/xref_stream.rb +204 -0
  158. data/lib/hexapdf/type.rb +67 -0
  159. data/lib/hexapdf/utils/bit_field.rb +87 -0
  160. data/lib/hexapdf/utils/bit_stream.rb +148 -0
  161. data/lib/hexapdf/utils/lru_cache.rb +65 -0
  162. data/lib/hexapdf/utils/math_helpers.rb +55 -0
  163. data/lib/hexapdf/utils/object_hash.rb +130 -0
  164. data/lib/hexapdf/utils/pdf_doc_encoding.rb +93 -0
  165. data/lib/hexapdf/utils/sorted_tree_node.rb +339 -0
  166. data/lib/hexapdf/version.rb +39 -0
  167. data/lib/hexapdf/writer.rb +199 -0
  168. data/lib/hexapdf/xref_section.rb +152 -0
  169. data/lib/hexapdf.rb +34 -0
  170. data/man/man1/hexapdf.1 +249 -0
  171. data/test/data/aes-test-vectors/CBCGFSbox-128-decrypt.data.gz +0 -0
  172. data/test/data/aes-test-vectors/CBCGFSbox-128-encrypt.data.gz +0 -0
  173. data/test/data/aes-test-vectors/CBCGFSbox-192-decrypt.data.gz +0 -0
  174. data/test/data/aes-test-vectors/CBCGFSbox-192-encrypt.data.gz +0 -0
  175. data/test/data/aes-test-vectors/CBCGFSbox-256-decrypt.data.gz +0 -0
  176. data/test/data/aes-test-vectors/CBCGFSbox-256-encrypt.data.gz +0 -0
  177. data/test/data/aes-test-vectors/CBCKeySbox-128-decrypt.data.gz +0 -0
  178. data/test/data/aes-test-vectors/CBCKeySbox-128-encrypt.data.gz +0 -0
  179. data/test/data/aes-test-vectors/CBCKeySbox-192-decrypt.data.gz +0 -0
  180. data/test/data/aes-test-vectors/CBCKeySbox-192-encrypt.data.gz +0 -0
  181. data/test/data/aes-test-vectors/CBCKeySbox-256-decrypt.data.gz +0 -0
  182. data/test/data/aes-test-vectors/CBCKeySbox-256-encrypt.data.gz +0 -0
  183. data/test/data/aes-test-vectors/CBCVarKey-128-decrypt.data.gz +0 -0
  184. data/test/data/aes-test-vectors/CBCVarKey-128-encrypt.data.gz +0 -0
  185. data/test/data/aes-test-vectors/CBCVarKey-192-decrypt.data.gz +0 -0
  186. data/test/data/aes-test-vectors/CBCVarKey-192-encrypt.data.gz +0 -0
  187. data/test/data/aes-test-vectors/CBCVarKey-256-decrypt.data.gz +0 -0
  188. data/test/data/aes-test-vectors/CBCVarKey-256-encrypt.data.gz +0 -0
  189. data/test/data/aes-test-vectors/CBCVarTxt-128-decrypt.data.gz +0 -0
  190. data/test/data/aes-test-vectors/CBCVarTxt-128-encrypt.data.gz +0 -0
  191. data/test/data/aes-test-vectors/CBCVarTxt-192-decrypt.data.gz +0 -0
  192. data/test/data/aes-test-vectors/CBCVarTxt-192-encrypt.data.gz +0 -0
  193. data/test/data/aes-test-vectors/CBCVarTxt-256-decrypt.data.gz +0 -0
  194. data/test/data/aes-test-vectors/CBCVarTxt-256-encrypt.data.gz +0 -0
  195. data/test/data/fonts/Ubuntu-Title.ttf +0 -0
  196. data/test/data/images/cmyk.jpg +0 -0
  197. data/test/data/images/fillbytes.jpg +0 -0
  198. data/test/data/images/gray.jpg +0 -0
  199. data/test/data/images/greyscale-1bit.png +0 -0
  200. data/test/data/images/greyscale-2bit.png +0 -0
  201. data/test/data/images/greyscale-4bit.png +0 -0
  202. data/test/data/images/greyscale-8bit.png +0 -0
  203. data/test/data/images/greyscale-alpha-8bit.png +0 -0
  204. data/test/data/images/greyscale-trns-8bit.png +0 -0
  205. data/test/data/images/greyscale-with-gamma1.0.png +0 -0
  206. data/test/data/images/greyscale-with-gamma1.5.png +0 -0
  207. data/test/data/images/indexed-1bit.png +0 -0
  208. data/test/data/images/indexed-2bit.png +0 -0
  209. data/test/data/images/indexed-4bit.png +0 -0
  210. data/test/data/images/indexed-8bit.png +0 -0
  211. data/test/data/images/indexed-alpha-4bit.png +0 -0
  212. data/test/data/images/indexed-alpha-8bit.png +0 -0
  213. data/test/data/images/rgb.jpg +0 -0
  214. data/test/data/images/truecolour-8bit.png +0 -0
  215. data/test/data/images/truecolour-alpha-8bit.png +0 -0
  216. data/test/data/images/truecolour-gama-chrm-8bit.png +0 -0
  217. data/test/data/images/truecolour-srgb-8bit.png +0 -0
  218. data/test/data/minimal.pdf +44 -0
  219. data/test/data/standard-security-handler/README +9 -0
  220. data/test/data/standard-security-handler/bothpwd-aes-128bit-V4.pdf +44 -0
  221. data/test/data/standard-security-handler/bothpwd-aes-256bit-V5.pdf +0 -0
  222. data/test/data/standard-security-handler/bothpwd-arc4-128bit-V2.pdf +43 -0
  223. data/test/data/standard-security-handler/bothpwd-arc4-128bit-V4.pdf +43 -0
  224. data/test/data/standard-security-handler/bothpwd-arc4-40bit-V1.pdf +0 -0
  225. data/test/data/standard-security-handler/nopwd-aes-128bit-V4.pdf +43 -0
  226. data/test/data/standard-security-handler/nopwd-aes-256bit-V5.pdf +0 -0
  227. data/test/data/standard-security-handler/nopwd-arc4-128bit-V2.pdf +43 -0
  228. data/test/data/standard-security-handler/nopwd-arc4-128bit-V4.pdf +43 -0
  229. data/test/data/standard-security-handler/nopwd-arc4-40bit-V1.pdf +43 -0
  230. data/test/data/standard-security-handler/ownerpwd-aes-128bit-V4.pdf +0 -0
  231. data/test/data/standard-security-handler/ownerpwd-aes-256bit-V5.pdf +43 -0
  232. data/test/data/standard-security-handler/ownerpwd-arc4-128bit-V2.pdf +43 -0
  233. data/test/data/standard-security-handler/ownerpwd-arc4-128bit-V4.pdf +43 -0
  234. data/test/data/standard-security-handler/ownerpwd-arc4-40bit-V1.pdf +43 -0
  235. data/test/data/standard-security-handler/userpwd-aes-128bit-V4.pdf +43 -0
  236. data/test/data/standard-security-handler/userpwd-aes-256bit-V5.pdf +43 -0
  237. data/test/data/standard-security-handler/userpwd-arc4-128bit-V2.pdf +0 -0
  238. data/test/data/standard-security-handler/userpwd-arc4-128bit-V4.pdf +0 -0
  239. data/test/data/standard-security-handler/userpwd-arc4-40bit-V1.pdf +43 -0
  240. data/test/hexapdf/common_tokenizer_tests.rb +204 -0
  241. data/test/hexapdf/content/common.rb +31 -0
  242. data/test/hexapdf/content/graphic_object/test_arc.rb +93 -0
  243. data/test/hexapdf/content/graphic_object/test_endpoint_arc.rb +91 -0
  244. data/test/hexapdf/content/graphic_object/test_solid_arc.rb +86 -0
  245. data/test/hexapdf/content/test_canvas.rb +1113 -0
  246. data/test/hexapdf/content/test_color_space.rb +97 -0
  247. data/test/hexapdf/content/test_graphics_state.rb +138 -0
  248. data/test/hexapdf/content/test_operator.rb +619 -0
  249. data/test/hexapdf/content/test_parser.rb +66 -0
  250. data/test/hexapdf/content/test_processor.rb +156 -0
  251. data/test/hexapdf/content/test_transformation_matrix.rb +64 -0
  252. data/test/hexapdf/encryption/common.rb +87 -0
  253. data/test/hexapdf/encryption/test_aes.rb +121 -0
  254. data/test/hexapdf/encryption/test_arc4.rb +39 -0
  255. data/test/hexapdf/encryption/test_fast_aes.rb +17 -0
  256. data/test/hexapdf/encryption/test_fast_arc4.rb +12 -0
  257. data/test/hexapdf/encryption/test_identity.rb +21 -0
  258. data/test/hexapdf/encryption/test_ruby_aes.rb +23 -0
  259. data/test/hexapdf/encryption/test_ruby_arc4.rb +20 -0
  260. data/test/hexapdf/encryption/test_security_handler.rb +356 -0
  261. data/test/hexapdf/encryption/test_standard_security_handler.rb +274 -0
  262. data/test/hexapdf/filter/common.rb +53 -0
  263. data/test/hexapdf/filter/test_ascii85_decode.rb +60 -0
  264. data/test/hexapdf/filter/test_ascii_hex_decode.rb +33 -0
  265. data/test/hexapdf/filter/test_encryption.rb +24 -0
  266. data/test/hexapdf/filter/test_flate_decode.rb +35 -0
  267. data/test/hexapdf/filter/test_lzw_decode.rb +52 -0
  268. data/test/hexapdf/filter/test_predictor.rb +183 -0
  269. data/test/hexapdf/filter/test_run_length_decode.rb +32 -0
  270. data/test/hexapdf/font/cmap/test_parser.rb +67 -0
  271. data/test/hexapdf/font/cmap/test_writer.rb +58 -0
  272. data/test/hexapdf/font/encoding/test_base.rb +35 -0
  273. data/test/hexapdf/font/encoding/test_difference_encoding.rb +21 -0
  274. data/test/hexapdf/font/encoding/test_glyph_list.rb +59 -0
  275. data/test/hexapdf/font/encoding/test_zapf_dingbats_encoding.rb +16 -0
  276. data/test/hexapdf/font/test_encoding.rb +27 -0
  277. data/test/hexapdf/font/test_true_type_wrapper.rb +110 -0
  278. data/test/hexapdf/font/test_type1_wrapper.rb +66 -0
  279. data/test/hexapdf/font/true_type/common.rb +19 -0
  280. data/test/hexapdf/font/true_type/table/test_cmap.rb +59 -0
  281. data/test/hexapdf/font/true_type/table/test_cmap_subtable.rb +133 -0
  282. data/test/hexapdf/font/true_type/table/test_directory.rb +35 -0
  283. data/test/hexapdf/font/true_type/table/test_glyf.rb +58 -0
  284. data/test/hexapdf/font/true_type/table/test_head.rb +76 -0
  285. data/test/hexapdf/font/true_type/table/test_hhea.rb +40 -0
  286. data/test/hexapdf/font/true_type/table/test_hmtx.rb +38 -0
  287. data/test/hexapdf/font/true_type/table/test_loca.rb +43 -0
  288. data/test/hexapdf/font/true_type/table/test_maxp.rb +62 -0
  289. data/test/hexapdf/font/true_type/table/test_name.rb +95 -0
  290. data/test/hexapdf/font/true_type/table/test_os2.rb +65 -0
  291. data/test/hexapdf/font/true_type/table/test_post.rb +89 -0
  292. data/test/hexapdf/font/true_type/test_font.rb +120 -0
  293. data/test/hexapdf/font/true_type/test_table.rb +41 -0
  294. data/test/hexapdf/font/type1/test_afm_parser.rb +51 -0
  295. data/test/hexapdf/font/type1/test_font.rb +68 -0
  296. data/test/hexapdf/font/type1/test_pfb_parser.rb +37 -0
  297. data/test/hexapdf/font_loader/test_from_configuration.rb +28 -0
  298. data/test/hexapdf/font_loader/test_standard14.rb +22 -0
  299. data/test/hexapdf/image_loader/test_jpeg.rb +83 -0
  300. data/test/hexapdf/image_loader/test_pdf.rb +47 -0
  301. data/test/hexapdf/image_loader/test_png.rb +258 -0
  302. data/test/hexapdf/task/test_dereference.rb +46 -0
  303. data/test/hexapdf/task/test_optimize.rb +137 -0
  304. data/test/hexapdf/test_configuration.rb +82 -0
  305. data/test/hexapdf/test_data_dir.rb +32 -0
  306. data/test/hexapdf/test_dictionary.rb +284 -0
  307. data/test/hexapdf/test_dictionary_fields.rb +185 -0
  308. data/test/hexapdf/test_document.rb +574 -0
  309. data/test/hexapdf/test_document_utils.rb +144 -0
  310. data/test/hexapdf/test_filter.rb +96 -0
  311. data/test/hexapdf/test_font_utils.rb +47 -0
  312. data/test/hexapdf/test_importer.rb +78 -0
  313. data/test/hexapdf/test_object.rb +177 -0
  314. data/test/hexapdf/test_parser.rb +394 -0
  315. data/test/hexapdf/test_rectangle.rb +36 -0
  316. data/test/hexapdf/test_reference.rb +41 -0
  317. data/test/hexapdf/test_revision.rb +139 -0
  318. data/test/hexapdf/test_revisions.rb +93 -0
  319. data/test/hexapdf/test_serializer.rb +169 -0
  320. data/test/hexapdf/test_stream.rb +262 -0
  321. data/test/hexapdf/test_tokenizer.rb +30 -0
  322. data/test/hexapdf/test_writer.rb +120 -0
  323. data/test/hexapdf/test_xref_section.rb +35 -0
  324. data/test/hexapdf/type/test_catalog.rb +30 -0
  325. data/test/hexapdf/type/test_embedded_file.rb +16 -0
  326. data/test/hexapdf/type/test_file_specification.rb +148 -0
  327. data/test/hexapdf/type/test_font.rb +35 -0
  328. data/test/hexapdf/type/test_font_descriptor.rb +51 -0
  329. data/test/hexapdf/type/test_font_simple.rb +190 -0
  330. data/test/hexapdf/type/test_font_type1.rb +128 -0
  331. data/test/hexapdf/type/test_form.rb +60 -0
  332. data/test/hexapdf/type/test_info.rb +14 -0
  333. data/test/hexapdf/type/test_names.rb +9 -0
  334. data/test/hexapdf/type/test_object_stream.rb +84 -0
  335. data/test/hexapdf/type/test_page.rb +260 -0
  336. data/test/hexapdf/type/test_page_tree_node.rb +255 -0
  337. data/test/hexapdf/type/test_resources.rb +167 -0
  338. data/test/hexapdf/type/test_trailer.rb +109 -0
  339. data/test/hexapdf/type/test_xref_stream.rb +131 -0
  340. data/test/hexapdf/utils/test_bit_field.rb +47 -0
  341. data/test/hexapdf/utils/test_lru_cache.rb +22 -0
  342. data/test/hexapdf/utils/test_object_hash.rb +115 -0
  343. data/test/hexapdf/utils/test_pdf_doc_encoding.rb +18 -0
  344. data/test/hexapdf/utils/test_sorted_tree_node.rb +232 -0
  345. data/test/test_helper.rb +56 -0
  346. metadata +427 -0
@@ -0,0 +1,326 @@
1
+ # -*- encoding: utf-8 -*-
2
+ #
3
+ #--
4
+ # This file is part of HexaPDF.
5
+ #
6
+ # HexaPDF - A Versatile PDF Creation and Manipulation Library For Ruby
7
+ # Copyright (C) 2016 Thomas Leitner
8
+ #
9
+ # HexaPDF is free software: you can redistribute it and/or modify it
10
+ # under the terms of the GNU Affero General Public License version 3 as
11
+ # published by the Free Software Foundation with the addition of the
12
+ # following permission added to Section 15 as permitted in Section 7(a):
13
+ # FOR ANY PART OF THE COVERED WORK IN WHICH THE COPYRIGHT IS OWNED BY
14
+ # THOMAS LEITNER, THOMAS LEITNER DISCLAIMS THE WARRANTY OF NON
15
+ # INFRINGEMENT OF THIRD PARTY RIGHTS.
16
+ #
17
+ # HexaPDF is distributed in the hope that it will be useful, but WITHOUT
18
+ # ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
19
+ # FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public
20
+ # License for more details.
21
+ #
22
+ # You should have received a copy of the GNU Affero General Public License
23
+ # along with HexaPDF. If not, see <http://www.gnu.org/licenses/>.
24
+ #
25
+ # The interactive user interfaces in modified source and object code
26
+ # versions of HexaPDF must display Appropriate Legal Notices, as required
27
+ # under Section 5 of the GNU Affero General Public License version 3.
28
+ #
29
+ # In accordance with Section 7(b) of the GNU Affero General Public
30
+ # License, a covered work must retain the producer line in every PDF that
31
+ # is created or manipulated using HexaPDF.
32
+ #++
33
+
34
+ require 'time'
35
+ require 'hexapdf/tokenizer'
36
+ require 'hexapdf/filter'
37
+ require 'hexapdf/utils/lru_cache'
38
+
39
+ module HexaPDF
40
+
41
+ # Knows how to serialize Ruby objects for a PDF file.
42
+ #
43
+ # For normal serialization purposes, the #serialize or #serialize_to_io methods should be used.
44
+ # However, if the type of the object to be serialized is known, a specialized serialization
45
+ # method like #serialize_float can be used.
46
+ #
47
+ # Additionally, an object for encrypting strings and streams while serializing can be set via the
48
+ # #encrypter= method. The assigned object has to respond to #encrypt_string(str, ind_obj) (where
49
+ # the string is part of the indirect object; returns the encrypted string) and
50
+ # #encrypt_stream(stream) (returns a fiber that represents the encrypted stream).
51
+ #
52
+ #
53
+ # == How This Class Works
54
+ #
55
+ # The main public interface consists of the #serialize and #serialize_to_io methods which accept
56
+ # an object and return its serialized form. During serialization of this object it is accessible
57
+ # by individual serialization methods via the @object instance variable (useful if the object is a
58
+ # composed object).
59
+ #
60
+ # Internally, the #__serialize method is used for invoking the correct serialization method
61
+ # based on the class of a given object. It is also used for serializing individual parts of a
62
+ # composed object.
63
+ #
64
+ # Therefore the serializer contains one serialization method for each class it needs to
65
+ # serialize. The naming scheme of these methods is based on the class name: The full class name
66
+ # is converted to lowercase, the namespace separator '::' is replaced with a single underscore
67
+ # and the string "serialize_" is then prepended.
68
+ #
69
+ # Examples:
70
+ #
71
+ # NilClass => serialize_nilclass
72
+ # TrueClass => serialize_trueclass
73
+ # HexaPDF::Object => serialize_hexapdf_object
74
+ #
75
+ # If no serialization method for a specific class is found, the ancestors classes are tried.
76
+ #
77
+ # See: PDF1.7 s7.3
78
+ class Serializer
79
+
80
+ # The encrypter to use for encrypting strings and streams. If +nil+, strings and streams are not
81
+ # encrypted.
82
+ #
83
+ # Default: +nil+
84
+ attr_accessor :encrypter
85
+
86
+ # Creates a new Serializer object.
87
+ def initialize
88
+ @dispatcher = Hash.new do |h, klass|
89
+ method = nil
90
+ klass.ancestors.each do |ancestor_klass|
91
+ method = "serialize_#{ancestor_klass.name.downcase.gsub(/::/, '_')}"
92
+ (h[klass] = method; break) if respond_to?(method, true)
93
+ end
94
+ method
95
+ end
96
+ @encrypter = false
97
+ @io = nil
98
+ @object = nil
99
+ end
100
+
101
+ # Returns the serialized form of the given object.
102
+ #
103
+ # For developers: While the object is serialized, methods can use the instance variable
104
+ # @object to obtain information about or use the object in case it is a composed object.
105
+ def serialize(obj)
106
+ @object = obj
107
+ __serialize(obj)
108
+ ensure
109
+ @object = nil
110
+ end
111
+
112
+ # Serializes the given object and writes it to the IO.
113
+ #
114
+ # Also see: #serialize
115
+ def serialize_to_io(obj, io)
116
+ @io = io
117
+ @io << serialize(obj).freeze
118
+ ensure
119
+ @io = nil
120
+ end
121
+
122
+ # Serializes the +nil+ value.
123
+ #
124
+ # See: PDF1.7 s7.3.9
125
+ def serialize_nilclass(_obj)
126
+ "null"
127
+ end
128
+
129
+ # Serializes the +true+ value.
130
+ #
131
+ # See: PDF1.7 s7.3.2
132
+ def serialize_trueclass(_obj)
133
+ "true"
134
+ end
135
+
136
+ # Serializes the +false+ value.
137
+ #
138
+ # See: PDF1.7 s7.3.2
139
+ def serialize_falseclass(_obj)
140
+ "false"
141
+ end
142
+
143
+ # Serializes a Numeric object (either Integer or Float).
144
+ #
145
+ # This method should be used for cases where it is known that the object is either an Integer
146
+ # or a Float.
147
+ #
148
+ # See: PDF1.7 s7.3.3
149
+ def serialize_numeric(obj)
150
+ obj.kind_of?(Integer) ? obj.to_s : serialize_float(obj)
151
+ end
152
+
153
+ # Serializes an Integer object.
154
+ #
155
+ # See: PDF1.7 s7.3.3
156
+ def serialize_integer(obj)
157
+ obj.to_s
158
+ end
159
+
160
+ # Serializes a Float object.
161
+ #
162
+ # See: PDF1.7 s7.3.3
163
+ def serialize_float(obj)
164
+ obj.abs < 0.0001 && obj != 0 ? sprintf("%.6f".freeze, obj) : obj.round(6).to_s
165
+ end
166
+
167
+ # The regexp matches all characters that need to be escaped and the substs hash contains the
168
+ # mapping from these characters to their escaped form.
169
+ #
170
+ # See PDF1.7 s7.3.5
171
+ NAME_SUBSTS = {} # :nodoc:
172
+ [0..32, 127..255, Tokenizer::DELIMITER.bytes, Tokenizer::WHITESPACE.bytes, [35]].each do |a|
173
+ a.each {|c| NAME_SUBSTS[c.chr] = "##{c.to_s(16).rjust(2, "0")}"}
174
+ end
175
+ NAME_REGEXP = /[^!-~&&[^##{Regexp.escape(Tokenizer::DELIMITER)}#{Regexp.escape(Tokenizer::WHITESPACE)}]]/ # :nodoc:
176
+ NAME_CACHE = Utils::LRUCache.new(1000) # :nodoc:
177
+
178
+ # Serializes a Symbol object (i.e. a PDF name object).
179
+ #
180
+ # See: PDF1.7 s7.3.5
181
+ def serialize_symbol(obj)
182
+ NAME_CACHE[obj] ||=
183
+ begin
184
+ str = obj.to_s.force_encoding(Encoding::BINARY)
185
+ str.gsub!(NAME_REGEXP) {|m| NAME_SUBSTS[m]}
186
+ "/#{str}"
187
+ end
188
+ end
189
+
190
+ BYTE_IS_DELIMITER = {40 => true, 47 => true, 60 => true, 91 => true, # :nodoc:
191
+ 41 => true, 62 => true, 93 => true}
192
+
193
+ # Serializes an Array object.
194
+ #
195
+ # See: PDF1.7 s7.3.6
196
+ def serialize_array(obj)
197
+ str = "["
198
+ index = 0
199
+ while index < obj.size
200
+ tmp = __serialize(obj[index])
201
+ str << " ".freeze unless BYTE_IS_DELIMITER[tmp.getbyte(0)] ||
202
+ BYTE_IS_DELIMITER[str.getbyte(-1)]
203
+ str << tmp
204
+ index += 1
205
+ end
206
+ str << "]".freeze
207
+ end
208
+
209
+ # Serializes a Hash object (i.e. a PDF dictionary object).
210
+ #
211
+ # See: PDF1.7 s7.3.7
212
+ def serialize_hash(obj)
213
+ str = "<<"
214
+ obj.each do |k, v|
215
+ next if v.nil? || (v.respond_to?(:null?) && v.null?)
216
+ str << __serialize(k)
217
+ tmp = __serialize(v)
218
+ str << " ".freeze unless BYTE_IS_DELIMITER[tmp.getbyte(0)] ||
219
+ BYTE_IS_DELIMITER[str.getbyte(-1)]
220
+ str << tmp
221
+ end
222
+ str << ">>".freeze
223
+ end
224
+
225
+ STRING_ESCAPE_MAP = {"(" => "\\(", ")" => "\\)", "\\" => "\\\\", "\r" => "\\r"} # :nodoc:
226
+
227
+ # Serializes a String object.
228
+ #
229
+ # See: PDF1.7 s7.3.4
230
+ def serialize_string(obj)
231
+ if @encrypter && @object.kind_of?(HexaPDF::Object) && @object.indirect?
232
+ obj = encrypter.encrypt_string(obj, @object)
233
+ elsif obj.encoding != Encoding::BINARY && obj =~ /[^ -~\t\r\n]/
234
+ obj = "\xFE\xFF".b << obj.encode(Encoding::UTF_16BE).force_encoding(Encoding::BINARY)
235
+ elsif obj.encoding != Encoding::BINARY
236
+ obj = obj.b
237
+ end
238
+ "(" << obj.gsub(/[\(\)\\\r]/n) {|m| STRING_ESCAPE_MAP[m]} << ")".freeze
239
+ end
240
+
241
+ # The ISO PDF specification differs in respect to the supported date format. When converting
242
+ # to a date string, a format suitable for both is output.
243
+ #
244
+ # See: PDF1.7 s7.9.4, ADB1.7 3.8.3
245
+ def serialize_time(obj)
246
+ zone = obj.strftime("%z'")
247
+ if zone == "+0000'"
248
+ zone = ''
249
+ else
250
+ zone[3, 0] = "'"
251
+ end
252
+ serialize_string(obj.strftime("D:%Y%m%d%H%M%S#{zone}"))
253
+ end
254
+
255
+ # See: #serialize_time
256
+ def serialize_date(obj)
257
+ serialize_time(obj.to_time)
258
+ end
259
+
260
+ # See: #serialize_time
261
+ def serialize_datetime(obj)
262
+ serialize_time(obj.to_time)
263
+ end
264
+
265
+ private
266
+
267
+ # Uses #serialize_hexapdf_reference if it is an indirect object, otherwise just serializes
268
+ # the objects value.
269
+ def serialize_hexapdf_object(obj)
270
+ if obj.indirect? && obj != @object
271
+ serialize_hexapdf_reference(obj)
272
+ else
273
+ __serialize(obj.value)
274
+ end
275
+ end
276
+
277
+ # See: PDF1.7 s7.3.10
278
+ def serialize_hexapdf_reference(obj)
279
+ "#{obj.oid} #{obj.gen} R".freeze
280
+ end
281
+
282
+ # Serializes the streams dictionary and its stream.
283
+ #
284
+ # See: PDF1.7 s7.3.8
285
+ def serialize_hexapdf_stream(obj)
286
+ if !obj.indirect?
287
+ raise HexaPDF::Error, "Can't serialize PDF stream without object identifier"
288
+ elsif obj != @object
289
+ return serialize_hexapdf_reference(obj)
290
+ end
291
+
292
+ fiber = if @encrypter
293
+ encrypter.encrypt_stream(obj)
294
+ else
295
+ obj.stream_encoder
296
+ end
297
+
298
+ if @io && fiber.respond_to?(:length) && fiber.length >= 0
299
+ obj.value[:Length] = fiber.length
300
+ @io << __serialize(obj.value)
301
+ @io << "stream\n".freeze
302
+ while fiber.alive? && (data = fiber.resume)
303
+ @io << data.freeze
304
+ end
305
+ @io << "\nendstream".freeze
306
+
307
+ nil
308
+ else
309
+ data = Filter.string_from_source(fiber)
310
+ obj.value[:Length] = data.size
311
+
312
+ str = __serialize(obj.value)
313
+ str << "stream\n".freeze
314
+ str << data
315
+ str << "\nendstream".freeze
316
+ end
317
+ end
318
+
319
+ # Invokes the correct serialization method for the object.
320
+ def __serialize(obj)
321
+ send(@dispatcher[obj.class], obj)
322
+ end
323
+
324
+ end
325
+
326
+ end
@@ -0,0 +1,279 @@
1
+ # -*- encoding: utf-8 -*-
2
+ #
3
+ #--
4
+ # This file is part of HexaPDF.
5
+ #
6
+ # HexaPDF - A Versatile PDF Creation and Manipulation Library For Ruby
7
+ # Copyright (C) 2016 Thomas Leitner
8
+ #
9
+ # HexaPDF is free software: you can redistribute it and/or modify it
10
+ # under the terms of the GNU Affero General Public License version 3 as
11
+ # published by the Free Software Foundation with the addition of the
12
+ # following permission added to Section 15 as permitted in Section 7(a):
13
+ # FOR ANY PART OF THE COVERED WORK IN WHICH THE COPYRIGHT IS OWNED BY
14
+ # THOMAS LEITNER, THOMAS LEITNER DISCLAIMS THE WARRANTY OF NON
15
+ # INFRINGEMENT OF THIRD PARTY RIGHTS.
16
+ #
17
+ # HexaPDF is distributed in the hope that it will be useful, but WITHOUT
18
+ # ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
19
+ # FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public
20
+ # License for more details.
21
+ #
22
+ # You should have received a copy of the GNU Affero General Public License
23
+ # along with HexaPDF. If not, see <http://www.gnu.org/licenses/>.
24
+ #
25
+ # The interactive user interfaces in modified source and object code
26
+ # versions of HexaPDF must display Appropriate Legal Notices, as required
27
+ # under Section 5 of the GNU Affero General Public License version 3.
28
+ #
29
+ # In accordance with Section 7(b) of the GNU Affero General Public
30
+ # License, a covered work must retain the producer line in every PDF that
31
+ # is created or manipulated using HexaPDF.
32
+ #++
33
+
34
+ require 'hexapdf/error'
35
+ require 'hexapdf/dictionary'
36
+ require 'hexapdf/filter'
37
+
38
+ module HexaPDF
39
+
40
+ # Container for stream data that is more complex than a string.
41
+ #
42
+ # This helper class wraps all information necessary to read stream data by using a Fiber object
43
+ # (see HexaPDF::Filter). The underlying data either comes from an IO object, a file represented by
44
+ # its file name or a Fiber defined via a Proc object.
45
+ #
46
+ # Additionally, the #filter and #decode_parms can be set to indicate that the data returned from
47
+ # the Fiber needs to be post-processed. The +filter+ and +decode_parms+ are automatically
48
+ # normalized to arrays on assignment to ease further processing.
49
+ class StreamData
50
+
51
+ # The filter(s) that need to be applied for getting the decoded stream data.
52
+ attr_reader :filter
53
+
54
+ # The decoding parameters associated with the +filter+(s).
55
+ attr_reader :decode_parms
56
+
57
+ # :call-seq:
58
+ # StreamData.new(io) -> stream_data
59
+ # StreamData.new(str) -> stream_data
60
+ # StreamData.new(proc) -> stream_data
61
+ # StreamData.new { block } -> stream_data
62
+ #
63
+ # Creates a new StreamData object for the given +source+ and with the given options.
64
+ #
65
+ # The +source+ can be:
66
+ #
67
+ # * An IO stream which is read starting from a specific +offset+ for a specific +length+
68
+ #
69
+ # * A string which is interpreted as a file name and read starting from a specific +offset+
70
+ # * and for a specific +length+
71
+ #
72
+ # * A Proc object (that is converted to a Fiber when needed) in which case the +offset+ and
73
+ # value is ignored. The Proc object can also be passed by using a block.
74
+ def initialize(source = nil, offset: nil, length: nil, filter: nil, decode_parms: nil, &block)
75
+ if source.nil? && !block_given?
76
+ raise ArgumentError, "Either a source object or a block must be given"
77
+ end
78
+ @source = source || block
79
+ @offset = offset
80
+ @length = length
81
+ @filter = [filter].flatten.compact
82
+ @decode_parms = [decode_parms].flatten
83
+ freeze
84
+ end
85
+
86
+ # Returns a Fiber for getting at the data of the stream represented by this object.
87
+ def fiber(chunk_size = 0)
88
+ if @source.kind_of?(Proc)
89
+ FiberWithLength.new(@length, &@source)
90
+ elsif @source.kind_of?(String)
91
+ HexaPDF::Filter.source_from_file(@source, pos: @offset || 0, length: @length || -1,
92
+ chunk_size: chunk_size)
93
+ else
94
+ HexaPDF::Filter.source_from_io(@source, pos: @offset || 0, length: @length || -1,
95
+ chunk_size: chunk_size)
96
+ end
97
+ end
98
+
99
+ end
100
+
101
+ # Implements Stream objects of the PDF object system.
102
+ #
103
+ # == Stream Objects
104
+ #
105
+ # A stream may also be associated with a PDF object but only if the value is a PDF dictionary.
106
+ # This associated dictionary further describes the stream, like its length or how it is encoded.
107
+ #
108
+ # Such a stream object in PDF contains string data but of possibly unlimited length. Therefore
109
+ # it is used for large amounts of data like images, page descriptions or embedded files.
110
+ #
111
+ # The basic Object class cannot hold stream data, only this subclass contains the necessary
112
+ # methods to conveniently work with the stream data!
113
+ #
114
+ # See: PDF1.7 s7.3.8, Dictionary
115
+ class Stream < Dictionary
116
+
117
+ define_field :Length, type: Integer # not required, will be auto-filled when writing
118
+ define_field :Filter, type: [Symbol, Array]
119
+ define_field :DecodeParms, type: [Dictionary, Hash, Array]
120
+ define_field :F, type: :FileSpec, version: '1.2'
121
+ define_field :FFilter, type: [Symbol, Array], version: '1.2'
122
+ define_field :FDecodeParms, type: [Dictionary, Hash, Array], version: '1.2'
123
+ define_field :DL, type: Integer
124
+
125
+ # Stream objects must always be indirect.
126
+ def must_be_indirect?
127
+ true
128
+ end
129
+
130
+ # Assigns a new stream data object.
131
+ #
132
+ # The +stream+ argument can be a HexaPDF::StreamData object, a String object or +nil+.
133
+ #
134
+ # If +stream+ is +nil+, an empty binary string is used instead.
135
+ def stream=(stream)
136
+ data.stream = stream
137
+ after_data_change
138
+ end
139
+
140
+ # Returns the (possibly decoded) stream data as string.
141
+ #
142
+ # Note that modifications done to the returned string are not reflected in the Stream object
143
+ # itself. The modified string must explicitly be assigned via #stream= to take effect.
144
+ def stream
145
+ if data.stream.kind_of?(String)
146
+ data.stream.dup
147
+ else
148
+ HexaPDF::Filter.string_from_source(stream_decoder)
149
+ end
150
+ end
151
+
152
+ # Returns the raw stream object.
153
+ #
154
+ # The returned value can be of many different types (see #stream=). For working with the
155
+ # decoded stream contents use #stream.
156
+ def raw_stream
157
+ data.stream
158
+ end
159
+
160
+ # Returns the Fiber representing the unprocessed content of the stream.
161
+ def stream_source
162
+ if data.stream.kind_of?(String)
163
+ HexaPDF::Filter.source_from_string(data.stream)
164
+ else
165
+ data.stream.fiber(config['io.chunk_size'.freeze])
166
+ end
167
+ end
168
+
169
+ # Returns the decoder Fiber for the stream data.
170
+ #
171
+ # See the Filter module for more information on how to work with the fiber.
172
+ def stream_decoder
173
+ source = stream_source
174
+
175
+ if data.stream.kind_of?(StreamData)
176
+ data.stream.filter.zip(data.stream.decode_parms) do |filter, decode_parms|
177
+ source = filter_for_name(filter).decoder(source, decode_parms)
178
+ end
179
+ end
180
+
181
+ source
182
+ end
183
+
184
+ # Returns the encoder Fiber for the stream data.
185
+ #
186
+ # The two arguments can be used to add additional filters for *only* this returned encoder
187
+ # Fiber. They should normally *not* be used and are here for use by the encryption facilities.
188
+ #
189
+ # See the Filter module for more information on how to work with the fiber.
190
+ def stream_encoder(additional_filter = nil, additional_decode_parms = nil)
191
+ encoder_data = [additional_filter, document.unwrap(self[:Filter])].flatten.
192
+ zip([additional_decode_parms, document.unwrap(self[:DecodeParms])].flatten).
193
+ delete_if {|f, _| f.nil?}
194
+ source = stream_source
195
+
196
+ if data.stream.kind_of?(StreamData)
197
+ decoder_data = data.stream.filter.zip(data.stream.decode_parms)
198
+
199
+ while !decoder_data.empty? && !encoder_data.empty? && decoder_data.last == encoder_data.last
200
+ decoder_data.pop
201
+ encoder_data.pop
202
+ end
203
+
204
+ decoder_data.each do |filter, decode_parms|
205
+ source = filter_for_name(filter).decoder(source, decode_parms)
206
+ end
207
+ end
208
+
209
+ encoder_data.reverse!.each do |filter, decode_parms|
210
+ source = filter_for_name(filter).encoder(source, decode_parms)
211
+ end
212
+
213
+ source
214
+ end
215
+
216
+ # Sets the filters that should be used for encoding the stream.
217
+ #
218
+ # The arguments +filter+ as well as +decode_parms+ can either be a single items or arrays.
219
+ #
220
+ # The filters have to be specified in the *decoding order*! For example, if the filters would
221
+ # be [:A85, :Fl], the stream would first be encoded with the Flate and then with the ASCII85
222
+ # filter.
223
+ def set_filter(filter, decode_parms = nil)
224
+ if filter.nil? || (filter.kind_of?(Array) && filter.empty?)
225
+ delete(:Filter)
226
+ else
227
+ self[:Filter] = filter
228
+ end
229
+ if decode_parms.nil? || (decode_parms.kind_of?(Array) && decode_parms.empty?) ||
230
+ !key?(:Filter)
231
+ delete(:DecodeParms)
232
+ else
233
+ self[:DecodeParms] = decode_parms
234
+ end
235
+ end
236
+
237
+ private
238
+
239
+ # Makes sure that the stream data is either a String or a HexaPDF::StreamData object.
240
+ def after_data_change
241
+ super
242
+ data.stream ||= ''.b
243
+ unless data.stream.kind_of?(StreamData) || data.stream.kind_of?(String)
244
+ raise ArgumentError, "Object of class #{data.stream.class} cannot be used as stream value"
245
+ end
246
+ end
247
+
248
+ # Returns the filter object that corresponds to the given filter name.
249
+ #
250
+ # See: HexaPDF::Filter
251
+ def filter_for_name(filter_name)
252
+ GlobalConfiguration.constantize('filter.map', filter_name) do
253
+ raise HexaPDF::Error, "Unknown stream filter '#{filter_name}' encountered"
254
+ end
255
+ end
256
+
257
+ # :nodoc:
258
+ # A mapping from short name to long name for filters.
259
+ FILTER_MAP = {AHx: :ASCIIHexDecode, A85: :ASCII85Decode, LZW: :LZWDecode,
260
+ Fl: :FlateDecode, RL: :RunLengthDecode, CCF: :CCITTFaxDecode, DCT: :DCTDecode}
261
+
262
+ # Validates the /Filter entry so that it contains only long-name filter names.
263
+ def perform_validation
264
+ super
265
+ if value[:Filter].kind_of?(Symbol) && FILTER_MAP.key?(value[:Filter])
266
+ yield("A stream's /Filter entry may only use long-form filter names", true)
267
+ value[:Filter] = FILTER_MAP[value[:Filter]]
268
+ elsif value[:Filter].kind_of?(Array)
269
+ value[:Filter].map! do |filter|
270
+ next filter unless FILTER_MAP.key?(filter)
271
+ yield("A stream's /Filter entry may only use long-form filter names", true)
272
+ FILTER_MAP[filter]
273
+ end
274
+ end
275
+ end
276
+
277
+ end
278
+
279
+ end