hexapdf 0.1.0

Sign up to get free protection for your applications and to get access to all the features.
Files changed (346) hide show
  1. checksums.yaml +7 -0
  2. data/CONTRIBUTERS +3 -0
  3. data/LICENSE +26 -0
  4. data/README.md +88 -0
  5. data/Rakefile +121 -0
  6. data/VERSION +1 -0
  7. data/agpl-3.0.txt +661 -0
  8. data/bin/hexapdf +6 -0
  9. data/data/hexapdf/afm/Courier-Bold.afm +342 -0
  10. data/data/hexapdf/afm/Courier-BoldOblique.afm +342 -0
  11. data/data/hexapdf/afm/Courier-Oblique.afm +342 -0
  12. data/data/hexapdf/afm/Courier.afm +342 -0
  13. data/data/hexapdf/afm/Helvetica-Bold.afm +2827 -0
  14. data/data/hexapdf/afm/Helvetica-BoldOblique.afm +2827 -0
  15. data/data/hexapdf/afm/Helvetica-Oblique.afm +3051 -0
  16. data/data/hexapdf/afm/Helvetica.afm +3051 -0
  17. data/data/hexapdf/afm/MustRead.html +1 -0
  18. data/data/hexapdf/afm/Symbol.afm +213 -0
  19. data/data/hexapdf/afm/Times-Bold.afm +2588 -0
  20. data/data/hexapdf/afm/Times-BoldItalic.afm +2384 -0
  21. data/data/hexapdf/afm/Times-Italic.afm +2667 -0
  22. data/data/hexapdf/afm/Times-Roman.afm +2419 -0
  23. data/data/hexapdf/afm/ZapfDingbats.afm +225 -0
  24. data/data/hexapdf/encoding/glyphlist.txt +4305 -0
  25. data/data/hexapdf/encoding/zapfdingbats.txt +225 -0
  26. data/examples/arc.rb +50 -0
  27. data/examples/graphics.rb +274 -0
  28. data/examples/hello_world.rb +16 -0
  29. data/examples/machupicchu.jpg +0 -0
  30. data/examples/merging.rb +24 -0
  31. data/examples/optimizing.rb +20 -0
  32. data/examples/show_char_bboxes.rb +55 -0
  33. data/examples/standard_pdf_fonts.rb +72 -0
  34. data/examples/truetype.rb +45 -0
  35. data/lib/hexapdf/cli/extract.rb +128 -0
  36. data/lib/hexapdf/cli/info.rb +121 -0
  37. data/lib/hexapdf/cli/inspect.rb +157 -0
  38. data/lib/hexapdf/cli/modify.rb +218 -0
  39. data/lib/hexapdf/cli.rb +121 -0
  40. data/lib/hexapdf/configuration.rb +392 -0
  41. data/lib/hexapdf/content/canvas.rb +1974 -0
  42. data/lib/hexapdf/content/color_space.rb +364 -0
  43. data/lib/hexapdf/content/graphic_object/arc.rb +267 -0
  44. data/lib/hexapdf/content/graphic_object/endpoint_arc.rb +208 -0
  45. data/lib/hexapdf/content/graphic_object/solid_arc.rb +173 -0
  46. data/lib/hexapdf/content/graphic_object.rb +81 -0
  47. data/lib/hexapdf/content/graphics_state.rb +579 -0
  48. data/lib/hexapdf/content/operator.rb +1072 -0
  49. data/lib/hexapdf/content/parser.rb +204 -0
  50. data/lib/hexapdf/content/processor.rb +451 -0
  51. data/lib/hexapdf/content/transformation_matrix.rb +172 -0
  52. data/lib/hexapdf/content.rb +47 -0
  53. data/lib/hexapdf/data_dir.rb +51 -0
  54. data/lib/hexapdf/dictionary.rb +303 -0
  55. data/lib/hexapdf/dictionary_fields.rb +382 -0
  56. data/lib/hexapdf/document.rb +589 -0
  57. data/lib/hexapdf/document_utils.rb +209 -0
  58. data/lib/hexapdf/encryption/aes.rb +206 -0
  59. data/lib/hexapdf/encryption/arc4.rb +93 -0
  60. data/lib/hexapdf/encryption/fast_aes.rb +79 -0
  61. data/lib/hexapdf/encryption/fast_arc4.rb +67 -0
  62. data/lib/hexapdf/encryption/identity.rb +63 -0
  63. data/lib/hexapdf/encryption/ruby_aes.rb +447 -0
  64. data/lib/hexapdf/encryption/ruby_arc4.rb +96 -0
  65. data/lib/hexapdf/encryption/security_handler.rb +494 -0
  66. data/lib/hexapdf/encryption/standard_security_handler.rb +616 -0
  67. data/lib/hexapdf/encryption.rb +94 -0
  68. data/lib/hexapdf/error.rb +73 -0
  69. data/lib/hexapdf/filter/ascii85_decode.rb +160 -0
  70. data/lib/hexapdf/filter/ascii_hex_decode.rb +87 -0
  71. data/lib/hexapdf/filter/dct_decode.rb +57 -0
  72. data/lib/hexapdf/filter/encryption.rb +59 -0
  73. data/lib/hexapdf/filter/flate_decode.rb +93 -0
  74. data/lib/hexapdf/filter/jpx_decode.rb +56 -0
  75. data/lib/hexapdf/filter/lzw_decode.rb +191 -0
  76. data/lib/hexapdf/filter/predictor.rb +266 -0
  77. data/lib/hexapdf/filter/run_length_decode.rb +108 -0
  78. data/lib/hexapdf/filter.rb +176 -0
  79. data/lib/hexapdf/font/cmap/parser.rb +146 -0
  80. data/lib/hexapdf/font/cmap/writer.rb +176 -0
  81. data/lib/hexapdf/font/cmap.rb +90 -0
  82. data/lib/hexapdf/font/encoding/base.rb +77 -0
  83. data/lib/hexapdf/font/encoding/difference_encoding.rb +64 -0
  84. data/lib/hexapdf/font/encoding/glyph_list.rb +150 -0
  85. data/lib/hexapdf/font/encoding/mac_expert_encoding.rb +221 -0
  86. data/lib/hexapdf/font/encoding/mac_roman_encoding.rb +265 -0
  87. data/lib/hexapdf/font/encoding/standard_encoding.rb +205 -0
  88. data/lib/hexapdf/font/encoding/symbol_encoding.rb +244 -0
  89. data/lib/hexapdf/font/encoding/win_ansi_encoding.rb +280 -0
  90. data/lib/hexapdf/font/encoding/zapf_dingbats_encoding.rb +250 -0
  91. data/lib/hexapdf/font/encoding.rb +68 -0
  92. data/lib/hexapdf/font/true_type/font.rb +179 -0
  93. data/lib/hexapdf/font/true_type/table/cmap.rb +103 -0
  94. data/lib/hexapdf/font/true_type/table/cmap_subtable.rb +384 -0
  95. data/lib/hexapdf/font/true_type/table/directory.rb +92 -0
  96. data/lib/hexapdf/font/true_type/table/glyf.rb +166 -0
  97. data/lib/hexapdf/font/true_type/table/head.rb +143 -0
  98. data/lib/hexapdf/font/true_type/table/hhea.rb +109 -0
  99. data/lib/hexapdf/font/true_type/table/hmtx.rb +79 -0
  100. data/lib/hexapdf/font/true_type/table/loca.rb +79 -0
  101. data/lib/hexapdf/font/true_type/table/maxp.rb +112 -0
  102. data/lib/hexapdf/font/true_type/table/name.rb +218 -0
  103. data/lib/hexapdf/font/true_type/table/os2.rb +200 -0
  104. data/lib/hexapdf/font/true_type/table/post.rb +230 -0
  105. data/lib/hexapdf/font/true_type/table.rb +155 -0
  106. data/lib/hexapdf/font/true_type.rb +48 -0
  107. data/lib/hexapdf/font/true_type_wrapper.rb +240 -0
  108. data/lib/hexapdf/font/type1/afm_parser.rb +230 -0
  109. data/lib/hexapdf/font/type1/character_metrics.rb +67 -0
  110. data/lib/hexapdf/font/type1/font.rb +123 -0
  111. data/lib/hexapdf/font/type1/font_metrics.rb +117 -0
  112. data/lib/hexapdf/font/type1/pfb_parser.rb +71 -0
  113. data/lib/hexapdf/font/type1.rb +52 -0
  114. data/lib/hexapdf/font/type1_wrapper.rb +193 -0
  115. data/lib/hexapdf/font_loader/from_configuration.rb +70 -0
  116. data/lib/hexapdf/font_loader/standard14.rb +98 -0
  117. data/lib/hexapdf/font_loader.rb +85 -0
  118. data/lib/hexapdf/font_utils.rb +89 -0
  119. data/lib/hexapdf/image_loader/jpeg.rb +166 -0
  120. data/lib/hexapdf/image_loader/pdf.rb +89 -0
  121. data/lib/hexapdf/image_loader/png.rb +410 -0
  122. data/lib/hexapdf/image_loader.rb +68 -0
  123. data/lib/hexapdf/importer.rb +139 -0
  124. data/lib/hexapdf/name_tree_node.rb +78 -0
  125. data/lib/hexapdf/number_tree_node.rb +67 -0
  126. data/lib/hexapdf/object.rb +363 -0
  127. data/lib/hexapdf/parser.rb +349 -0
  128. data/lib/hexapdf/rectangle.rb +99 -0
  129. data/lib/hexapdf/reference.rb +98 -0
  130. data/lib/hexapdf/revision.rb +206 -0
  131. data/lib/hexapdf/revisions.rb +194 -0
  132. data/lib/hexapdf/serializer.rb +326 -0
  133. data/lib/hexapdf/stream.rb +279 -0
  134. data/lib/hexapdf/task/dereference.rb +109 -0
  135. data/lib/hexapdf/task/optimize.rb +230 -0
  136. data/lib/hexapdf/task.rb +68 -0
  137. data/lib/hexapdf/tokenizer.rb +406 -0
  138. data/lib/hexapdf/type/catalog.rb +107 -0
  139. data/lib/hexapdf/type/embedded_file.rb +87 -0
  140. data/lib/hexapdf/type/file_specification.rb +232 -0
  141. data/lib/hexapdf/type/font.rb +81 -0
  142. data/lib/hexapdf/type/font_descriptor.rb +109 -0
  143. data/lib/hexapdf/type/font_simple.rb +190 -0
  144. data/lib/hexapdf/type/font_true_type.rb +47 -0
  145. data/lib/hexapdf/type/font_type1.rb +162 -0
  146. data/lib/hexapdf/type/form.rb +103 -0
  147. data/lib/hexapdf/type/graphics_state_parameter.rb +79 -0
  148. data/lib/hexapdf/type/image.rb +73 -0
  149. data/lib/hexapdf/type/info.rb +70 -0
  150. data/lib/hexapdf/type/names.rb +69 -0
  151. data/lib/hexapdf/type/object_stream.rb +224 -0
  152. data/lib/hexapdf/type/page.rb +355 -0
  153. data/lib/hexapdf/type/page_tree_node.rb +269 -0
  154. data/lib/hexapdf/type/resources.rb +212 -0
  155. data/lib/hexapdf/type/trailer.rb +128 -0
  156. data/lib/hexapdf/type/viewer_preferences.rb +73 -0
  157. data/lib/hexapdf/type/xref_stream.rb +204 -0
  158. data/lib/hexapdf/type.rb +67 -0
  159. data/lib/hexapdf/utils/bit_field.rb +87 -0
  160. data/lib/hexapdf/utils/bit_stream.rb +148 -0
  161. data/lib/hexapdf/utils/lru_cache.rb +65 -0
  162. data/lib/hexapdf/utils/math_helpers.rb +55 -0
  163. data/lib/hexapdf/utils/object_hash.rb +130 -0
  164. data/lib/hexapdf/utils/pdf_doc_encoding.rb +93 -0
  165. data/lib/hexapdf/utils/sorted_tree_node.rb +339 -0
  166. data/lib/hexapdf/version.rb +39 -0
  167. data/lib/hexapdf/writer.rb +199 -0
  168. data/lib/hexapdf/xref_section.rb +152 -0
  169. data/lib/hexapdf.rb +34 -0
  170. data/man/man1/hexapdf.1 +249 -0
  171. data/test/data/aes-test-vectors/CBCGFSbox-128-decrypt.data.gz +0 -0
  172. data/test/data/aes-test-vectors/CBCGFSbox-128-encrypt.data.gz +0 -0
  173. data/test/data/aes-test-vectors/CBCGFSbox-192-decrypt.data.gz +0 -0
  174. data/test/data/aes-test-vectors/CBCGFSbox-192-encrypt.data.gz +0 -0
  175. data/test/data/aes-test-vectors/CBCGFSbox-256-decrypt.data.gz +0 -0
  176. data/test/data/aes-test-vectors/CBCGFSbox-256-encrypt.data.gz +0 -0
  177. data/test/data/aes-test-vectors/CBCKeySbox-128-decrypt.data.gz +0 -0
  178. data/test/data/aes-test-vectors/CBCKeySbox-128-encrypt.data.gz +0 -0
  179. data/test/data/aes-test-vectors/CBCKeySbox-192-decrypt.data.gz +0 -0
  180. data/test/data/aes-test-vectors/CBCKeySbox-192-encrypt.data.gz +0 -0
  181. data/test/data/aes-test-vectors/CBCKeySbox-256-decrypt.data.gz +0 -0
  182. data/test/data/aes-test-vectors/CBCKeySbox-256-encrypt.data.gz +0 -0
  183. data/test/data/aes-test-vectors/CBCVarKey-128-decrypt.data.gz +0 -0
  184. data/test/data/aes-test-vectors/CBCVarKey-128-encrypt.data.gz +0 -0
  185. data/test/data/aes-test-vectors/CBCVarKey-192-decrypt.data.gz +0 -0
  186. data/test/data/aes-test-vectors/CBCVarKey-192-encrypt.data.gz +0 -0
  187. data/test/data/aes-test-vectors/CBCVarKey-256-decrypt.data.gz +0 -0
  188. data/test/data/aes-test-vectors/CBCVarKey-256-encrypt.data.gz +0 -0
  189. data/test/data/aes-test-vectors/CBCVarTxt-128-decrypt.data.gz +0 -0
  190. data/test/data/aes-test-vectors/CBCVarTxt-128-encrypt.data.gz +0 -0
  191. data/test/data/aes-test-vectors/CBCVarTxt-192-decrypt.data.gz +0 -0
  192. data/test/data/aes-test-vectors/CBCVarTxt-192-encrypt.data.gz +0 -0
  193. data/test/data/aes-test-vectors/CBCVarTxt-256-decrypt.data.gz +0 -0
  194. data/test/data/aes-test-vectors/CBCVarTxt-256-encrypt.data.gz +0 -0
  195. data/test/data/fonts/Ubuntu-Title.ttf +0 -0
  196. data/test/data/images/cmyk.jpg +0 -0
  197. data/test/data/images/fillbytes.jpg +0 -0
  198. data/test/data/images/gray.jpg +0 -0
  199. data/test/data/images/greyscale-1bit.png +0 -0
  200. data/test/data/images/greyscale-2bit.png +0 -0
  201. data/test/data/images/greyscale-4bit.png +0 -0
  202. data/test/data/images/greyscale-8bit.png +0 -0
  203. data/test/data/images/greyscale-alpha-8bit.png +0 -0
  204. data/test/data/images/greyscale-trns-8bit.png +0 -0
  205. data/test/data/images/greyscale-with-gamma1.0.png +0 -0
  206. data/test/data/images/greyscale-with-gamma1.5.png +0 -0
  207. data/test/data/images/indexed-1bit.png +0 -0
  208. data/test/data/images/indexed-2bit.png +0 -0
  209. data/test/data/images/indexed-4bit.png +0 -0
  210. data/test/data/images/indexed-8bit.png +0 -0
  211. data/test/data/images/indexed-alpha-4bit.png +0 -0
  212. data/test/data/images/indexed-alpha-8bit.png +0 -0
  213. data/test/data/images/rgb.jpg +0 -0
  214. data/test/data/images/truecolour-8bit.png +0 -0
  215. data/test/data/images/truecolour-alpha-8bit.png +0 -0
  216. data/test/data/images/truecolour-gama-chrm-8bit.png +0 -0
  217. data/test/data/images/truecolour-srgb-8bit.png +0 -0
  218. data/test/data/minimal.pdf +44 -0
  219. data/test/data/standard-security-handler/README +9 -0
  220. data/test/data/standard-security-handler/bothpwd-aes-128bit-V4.pdf +44 -0
  221. data/test/data/standard-security-handler/bothpwd-aes-256bit-V5.pdf +0 -0
  222. data/test/data/standard-security-handler/bothpwd-arc4-128bit-V2.pdf +43 -0
  223. data/test/data/standard-security-handler/bothpwd-arc4-128bit-V4.pdf +43 -0
  224. data/test/data/standard-security-handler/bothpwd-arc4-40bit-V1.pdf +0 -0
  225. data/test/data/standard-security-handler/nopwd-aes-128bit-V4.pdf +43 -0
  226. data/test/data/standard-security-handler/nopwd-aes-256bit-V5.pdf +0 -0
  227. data/test/data/standard-security-handler/nopwd-arc4-128bit-V2.pdf +43 -0
  228. data/test/data/standard-security-handler/nopwd-arc4-128bit-V4.pdf +43 -0
  229. data/test/data/standard-security-handler/nopwd-arc4-40bit-V1.pdf +43 -0
  230. data/test/data/standard-security-handler/ownerpwd-aes-128bit-V4.pdf +0 -0
  231. data/test/data/standard-security-handler/ownerpwd-aes-256bit-V5.pdf +43 -0
  232. data/test/data/standard-security-handler/ownerpwd-arc4-128bit-V2.pdf +43 -0
  233. data/test/data/standard-security-handler/ownerpwd-arc4-128bit-V4.pdf +43 -0
  234. data/test/data/standard-security-handler/ownerpwd-arc4-40bit-V1.pdf +43 -0
  235. data/test/data/standard-security-handler/userpwd-aes-128bit-V4.pdf +43 -0
  236. data/test/data/standard-security-handler/userpwd-aes-256bit-V5.pdf +43 -0
  237. data/test/data/standard-security-handler/userpwd-arc4-128bit-V2.pdf +0 -0
  238. data/test/data/standard-security-handler/userpwd-arc4-128bit-V4.pdf +0 -0
  239. data/test/data/standard-security-handler/userpwd-arc4-40bit-V1.pdf +43 -0
  240. data/test/hexapdf/common_tokenizer_tests.rb +204 -0
  241. data/test/hexapdf/content/common.rb +31 -0
  242. data/test/hexapdf/content/graphic_object/test_arc.rb +93 -0
  243. data/test/hexapdf/content/graphic_object/test_endpoint_arc.rb +91 -0
  244. data/test/hexapdf/content/graphic_object/test_solid_arc.rb +86 -0
  245. data/test/hexapdf/content/test_canvas.rb +1113 -0
  246. data/test/hexapdf/content/test_color_space.rb +97 -0
  247. data/test/hexapdf/content/test_graphics_state.rb +138 -0
  248. data/test/hexapdf/content/test_operator.rb +619 -0
  249. data/test/hexapdf/content/test_parser.rb +66 -0
  250. data/test/hexapdf/content/test_processor.rb +156 -0
  251. data/test/hexapdf/content/test_transformation_matrix.rb +64 -0
  252. data/test/hexapdf/encryption/common.rb +87 -0
  253. data/test/hexapdf/encryption/test_aes.rb +121 -0
  254. data/test/hexapdf/encryption/test_arc4.rb +39 -0
  255. data/test/hexapdf/encryption/test_fast_aes.rb +17 -0
  256. data/test/hexapdf/encryption/test_fast_arc4.rb +12 -0
  257. data/test/hexapdf/encryption/test_identity.rb +21 -0
  258. data/test/hexapdf/encryption/test_ruby_aes.rb +23 -0
  259. data/test/hexapdf/encryption/test_ruby_arc4.rb +20 -0
  260. data/test/hexapdf/encryption/test_security_handler.rb +356 -0
  261. data/test/hexapdf/encryption/test_standard_security_handler.rb +274 -0
  262. data/test/hexapdf/filter/common.rb +53 -0
  263. data/test/hexapdf/filter/test_ascii85_decode.rb +60 -0
  264. data/test/hexapdf/filter/test_ascii_hex_decode.rb +33 -0
  265. data/test/hexapdf/filter/test_encryption.rb +24 -0
  266. data/test/hexapdf/filter/test_flate_decode.rb +35 -0
  267. data/test/hexapdf/filter/test_lzw_decode.rb +52 -0
  268. data/test/hexapdf/filter/test_predictor.rb +183 -0
  269. data/test/hexapdf/filter/test_run_length_decode.rb +32 -0
  270. data/test/hexapdf/font/cmap/test_parser.rb +67 -0
  271. data/test/hexapdf/font/cmap/test_writer.rb +58 -0
  272. data/test/hexapdf/font/encoding/test_base.rb +35 -0
  273. data/test/hexapdf/font/encoding/test_difference_encoding.rb +21 -0
  274. data/test/hexapdf/font/encoding/test_glyph_list.rb +59 -0
  275. data/test/hexapdf/font/encoding/test_zapf_dingbats_encoding.rb +16 -0
  276. data/test/hexapdf/font/test_encoding.rb +27 -0
  277. data/test/hexapdf/font/test_true_type_wrapper.rb +110 -0
  278. data/test/hexapdf/font/test_type1_wrapper.rb +66 -0
  279. data/test/hexapdf/font/true_type/common.rb +19 -0
  280. data/test/hexapdf/font/true_type/table/test_cmap.rb +59 -0
  281. data/test/hexapdf/font/true_type/table/test_cmap_subtable.rb +133 -0
  282. data/test/hexapdf/font/true_type/table/test_directory.rb +35 -0
  283. data/test/hexapdf/font/true_type/table/test_glyf.rb +58 -0
  284. data/test/hexapdf/font/true_type/table/test_head.rb +76 -0
  285. data/test/hexapdf/font/true_type/table/test_hhea.rb +40 -0
  286. data/test/hexapdf/font/true_type/table/test_hmtx.rb +38 -0
  287. data/test/hexapdf/font/true_type/table/test_loca.rb +43 -0
  288. data/test/hexapdf/font/true_type/table/test_maxp.rb +62 -0
  289. data/test/hexapdf/font/true_type/table/test_name.rb +95 -0
  290. data/test/hexapdf/font/true_type/table/test_os2.rb +65 -0
  291. data/test/hexapdf/font/true_type/table/test_post.rb +89 -0
  292. data/test/hexapdf/font/true_type/test_font.rb +120 -0
  293. data/test/hexapdf/font/true_type/test_table.rb +41 -0
  294. data/test/hexapdf/font/type1/test_afm_parser.rb +51 -0
  295. data/test/hexapdf/font/type1/test_font.rb +68 -0
  296. data/test/hexapdf/font/type1/test_pfb_parser.rb +37 -0
  297. data/test/hexapdf/font_loader/test_from_configuration.rb +28 -0
  298. data/test/hexapdf/font_loader/test_standard14.rb +22 -0
  299. data/test/hexapdf/image_loader/test_jpeg.rb +83 -0
  300. data/test/hexapdf/image_loader/test_pdf.rb +47 -0
  301. data/test/hexapdf/image_loader/test_png.rb +258 -0
  302. data/test/hexapdf/task/test_dereference.rb +46 -0
  303. data/test/hexapdf/task/test_optimize.rb +137 -0
  304. data/test/hexapdf/test_configuration.rb +82 -0
  305. data/test/hexapdf/test_data_dir.rb +32 -0
  306. data/test/hexapdf/test_dictionary.rb +284 -0
  307. data/test/hexapdf/test_dictionary_fields.rb +185 -0
  308. data/test/hexapdf/test_document.rb +574 -0
  309. data/test/hexapdf/test_document_utils.rb +144 -0
  310. data/test/hexapdf/test_filter.rb +96 -0
  311. data/test/hexapdf/test_font_utils.rb +47 -0
  312. data/test/hexapdf/test_importer.rb +78 -0
  313. data/test/hexapdf/test_object.rb +177 -0
  314. data/test/hexapdf/test_parser.rb +394 -0
  315. data/test/hexapdf/test_rectangle.rb +36 -0
  316. data/test/hexapdf/test_reference.rb +41 -0
  317. data/test/hexapdf/test_revision.rb +139 -0
  318. data/test/hexapdf/test_revisions.rb +93 -0
  319. data/test/hexapdf/test_serializer.rb +169 -0
  320. data/test/hexapdf/test_stream.rb +262 -0
  321. data/test/hexapdf/test_tokenizer.rb +30 -0
  322. data/test/hexapdf/test_writer.rb +120 -0
  323. data/test/hexapdf/test_xref_section.rb +35 -0
  324. data/test/hexapdf/type/test_catalog.rb +30 -0
  325. data/test/hexapdf/type/test_embedded_file.rb +16 -0
  326. data/test/hexapdf/type/test_file_specification.rb +148 -0
  327. data/test/hexapdf/type/test_font.rb +35 -0
  328. data/test/hexapdf/type/test_font_descriptor.rb +51 -0
  329. data/test/hexapdf/type/test_font_simple.rb +190 -0
  330. data/test/hexapdf/type/test_font_type1.rb +128 -0
  331. data/test/hexapdf/type/test_form.rb +60 -0
  332. data/test/hexapdf/type/test_info.rb +14 -0
  333. data/test/hexapdf/type/test_names.rb +9 -0
  334. data/test/hexapdf/type/test_object_stream.rb +84 -0
  335. data/test/hexapdf/type/test_page.rb +260 -0
  336. data/test/hexapdf/type/test_page_tree_node.rb +255 -0
  337. data/test/hexapdf/type/test_resources.rb +167 -0
  338. data/test/hexapdf/type/test_trailer.rb +109 -0
  339. data/test/hexapdf/type/test_xref_stream.rb +131 -0
  340. data/test/hexapdf/utils/test_bit_field.rb +47 -0
  341. data/test/hexapdf/utils/test_lru_cache.rb +22 -0
  342. data/test/hexapdf/utils/test_object_hash.rb +115 -0
  343. data/test/hexapdf/utils/test_pdf_doc_encoding.rb +18 -0
  344. data/test/hexapdf/utils/test_sorted_tree_node.rb +232 -0
  345. data/test/test_helper.rb +56 -0
  346. metadata +427 -0
@@ -0,0 +1,326 @@
1
+ # -*- encoding: utf-8 -*-
2
+ #
3
+ #--
4
+ # This file is part of HexaPDF.
5
+ #
6
+ # HexaPDF - A Versatile PDF Creation and Manipulation Library For Ruby
7
+ # Copyright (C) 2016 Thomas Leitner
8
+ #
9
+ # HexaPDF is free software: you can redistribute it and/or modify it
10
+ # under the terms of the GNU Affero General Public License version 3 as
11
+ # published by the Free Software Foundation with the addition of the
12
+ # following permission added to Section 15 as permitted in Section 7(a):
13
+ # FOR ANY PART OF THE COVERED WORK IN WHICH THE COPYRIGHT IS OWNED BY
14
+ # THOMAS LEITNER, THOMAS LEITNER DISCLAIMS THE WARRANTY OF NON
15
+ # INFRINGEMENT OF THIRD PARTY RIGHTS.
16
+ #
17
+ # HexaPDF is distributed in the hope that it will be useful, but WITHOUT
18
+ # ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
19
+ # FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public
20
+ # License for more details.
21
+ #
22
+ # You should have received a copy of the GNU Affero General Public License
23
+ # along with HexaPDF. If not, see <http://www.gnu.org/licenses/>.
24
+ #
25
+ # The interactive user interfaces in modified source and object code
26
+ # versions of HexaPDF must display Appropriate Legal Notices, as required
27
+ # under Section 5 of the GNU Affero General Public License version 3.
28
+ #
29
+ # In accordance with Section 7(b) of the GNU Affero General Public
30
+ # License, a covered work must retain the producer line in every PDF that
31
+ # is created or manipulated using HexaPDF.
32
+ #++
33
+
34
+ require 'time'
35
+ require 'hexapdf/tokenizer'
36
+ require 'hexapdf/filter'
37
+ require 'hexapdf/utils/lru_cache'
38
+
39
+ module HexaPDF
40
+
41
+ # Knows how to serialize Ruby objects for a PDF file.
42
+ #
43
+ # For normal serialization purposes, the #serialize or #serialize_to_io methods should be used.
44
+ # However, if the type of the object to be serialized is known, a specialized serialization
45
+ # method like #serialize_float can be used.
46
+ #
47
+ # Additionally, an object for encrypting strings and streams while serializing can be set via the
48
+ # #encrypter= method. The assigned object has to respond to #encrypt_string(str, ind_obj) (where
49
+ # the string is part of the indirect object; returns the encrypted string) and
50
+ # #encrypt_stream(stream) (returns a fiber that represents the encrypted stream).
51
+ #
52
+ #
53
+ # == How This Class Works
54
+ #
55
+ # The main public interface consists of the #serialize and #serialize_to_io methods which accept
56
+ # an object and return its serialized form. During serialization of this object it is accessible
57
+ # by individual serialization methods via the @object instance variable (useful if the object is a
58
+ # composed object).
59
+ #
60
+ # Internally, the #__serialize method is used for invoking the correct serialization method
61
+ # based on the class of a given object. It is also used for serializing individual parts of a
62
+ # composed object.
63
+ #
64
+ # Therefore the serializer contains one serialization method for each class it needs to
65
+ # serialize. The naming scheme of these methods is based on the class name: The full class name
66
+ # is converted to lowercase, the namespace separator '::' is replaced with a single underscore
67
+ # and the string "serialize_" is then prepended.
68
+ #
69
+ # Examples:
70
+ #
71
+ # NilClass => serialize_nilclass
72
+ # TrueClass => serialize_trueclass
73
+ # HexaPDF::Object => serialize_hexapdf_object
74
+ #
75
+ # If no serialization method for a specific class is found, the ancestors classes are tried.
76
+ #
77
+ # See: PDF1.7 s7.3
78
+ class Serializer
79
+
80
+ # The encrypter to use for encrypting strings and streams. If +nil+, strings and streams are not
81
+ # encrypted.
82
+ #
83
+ # Default: +nil+
84
+ attr_accessor :encrypter
85
+
86
+ # Creates a new Serializer object.
87
+ def initialize
88
+ @dispatcher = Hash.new do |h, klass|
89
+ method = nil
90
+ klass.ancestors.each do |ancestor_klass|
91
+ method = "serialize_#{ancestor_klass.name.downcase.gsub(/::/, '_')}"
92
+ (h[klass] = method; break) if respond_to?(method, true)
93
+ end
94
+ method
95
+ end
96
+ @encrypter = false
97
+ @io = nil
98
+ @object = nil
99
+ end
100
+
101
+ # Returns the serialized form of the given object.
102
+ #
103
+ # For developers: While the object is serialized, methods can use the instance variable
104
+ # @object to obtain information about or use the object in case it is a composed object.
105
+ def serialize(obj)
106
+ @object = obj
107
+ __serialize(obj)
108
+ ensure
109
+ @object = nil
110
+ end
111
+
112
+ # Serializes the given object and writes it to the IO.
113
+ #
114
+ # Also see: #serialize
115
+ def serialize_to_io(obj, io)
116
+ @io = io
117
+ @io << serialize(obj).freeze
118
+ ensure
119
+ @io = nil
120
+ end
121
+
122
+ # Serializes the +nil+ value.
123
+ #
124
+ # See: PDF1.7 s7.3.9
125
+ def serialize_nilclass(_obj)
126
+ "null"
127
+ end
128
+
129
+ # Serializes the +true+ value.
130
+ #
131
+ # See: PDF1.7 s7.3.2
132
+ def serialize_trueclass(_obj)
133
+ "true"
134
+ end
135
+
136
+ # Serializes the +false+ value.
137
+ #
138
+ # See: PDF1.7 s7.3.2
139
+ def serialize_falseclass(_obj)
140
+ "false"
141
+ end
142
+
143
+ # Serializes a Numeric object (either Integer or Float).
144
+ #
145
+ # This method should be used for cases where it is known that the object is either an Integer
146
+ # or a Float.
147
+ #
148
+ # See: PDF1.7 s7.3.3
149
+ def serialize_numeric(obj)
150
+ obj.kind_of?(Integer) ? obj.to_s : serialize_float(obj)
151
+ end
152
+
153
+ # Serializes an Integer object.
154
+ #
155
+ # See: PDF1.7 s7.3.3
156
+ def serialize_integer(obj)
157
+ obj.to_s
158
+ end
159
+
160
+ # Serializes a Float object.
161
+ #
162
+ # See: PDF1.7 s7.3.3
163
+ def serialize_float(obj)
164
+ obj.abs < 0.0001 && obj != 0 ? sprintf("%.6f".freeze, obj) : obj.round(6).to_s
165
+ end
166
+
167
+ # The regexp matches all characters that need to be escaped and the substs hash contains the
168
+ # mapping from these characters to their escaped form.
169
+ #
170
+ # See PDF1.7 s7.3.5
171
+ NAME_SUBSTS = {} # :nodoc:
172
+ [0..32, 127..255, Tokenizer::DELIMITER.bytes, Tokenizer::WHITESPACE.bytes, [35]].each do |a|
173
+ a.each {|c| NAME_SUBSTS[c.chr] = "##{c.to_s(16).rjust(2, "0")}"}
174
+ end
175
+ NAME_REGEXP = /[^!-~&&[^##{Regexp.escape(Tokenizer::DELIMITER)}#{Regexp.escape(Tokenizer::WHITESPACE)}]]/ # :nodoc:
176
+ NAME_CACHE = Utils::LRUCache.new(1000) # :nodoc:
177
+
178
+ # Serializes a Symbol object (i.e. a PDF name object).
179
+ #
180
+ # See: PDF1.7 s7.3.5
181
+ def serialize_symbol(obj)
182
+ NAME_CACHE[obj] ||=
183
+ begin
184
+ str = obj.to_s.force_encoding(Encoding::BINARY)
185
+ str.gsub!(NAME_REGEXP) {|m| NAME_SUBSTS[m]}
186
+ "/#{str}"
187
+ end
188
+ end
189
+
190
+ BYTE_IS_DELIMITER = {40 => true, 47 => true, 60 => true, 91 => true, # :nodoc:
191
+ 41 => true, 62 => true, 93 => true}
192
+
193
+ # Serializes an Array object.
194
+ #
195
+ # See: PDF1.7 s7.3.6
196
+ def serialize_array(obj)
197
+ str = "["
198
+ index = 0
199
+ while index < obj.size
200
+ tmp = __serialize(obj[index])
201
+ str << " ".freeze unless BYTE_IS_DELIMITER[tmp.getbyte(0)] ||
202
+ BYTE_IS_DELIMITER[str.getbyte(-1)]
203
+ str << tmp
204
+ index += 1
205
+ end
206
+ str << "]".freeze
207
+ end
208
+
209
+ # Serializes a Hash object (i.e. a PDF dictionary object).
210
+ #
211
+ # See: PDF1.7 s7.3.7
212
+ def serialize_hash(obj)
213
+ str = "<<"
214
+ obj.each do |k, v|
215
+ next if v.nil? || (v.respond_to?(:null?) && v.null?)
216
+ str << __serialize(k)
217
+ tmp = __serialize(v)
218
+ str << " ".freeze unless BYTE_IS_DELIMITER[tmp.getbyte(0)] ||
219
+ BYTE_IS_DELIMITER[str.getbyte(-1)]
220
+ str << tmp
221
+ end
222
+ str << ">>".freeze
223
+ end
224
+
225
+ STRING_ESCAPE_MAP = {"(" => "\\(", ")" => "\\)", "\\" => "\\\\", "\r" => "\\r"} # :nodoc:
226
+
227
+ # Serializes a String object.
228
+ #
229
+ # See: PDF1.7 s7.3.4
230
+ def serialize_string(obj)
231
+ if @encrypter && @object.kind_of?(HexaPDF::Object) && @object.indirect?
232
+ obj = encrypter.encrypt_string(obj, @object)
233
+ elsif obj.encoding != Encoding::BINARY && obj =~ /[^ -~\t\r\n]/
234
+ obj = "\xFE\xFF".b << obj.encode(Encoding::UTF_16BE).force_encoding(Encoding::BINARY)
235
+ elsif obj.encoding != Encoding::BINARY
236
+ obj = obj.b
237
+ end
238
+ "(" << obj.gsub(/[\(\)\\\r]/n) {|m| STRING_ESCAPE_MAP[m]} << ")".freeze
239
+ end
240
+
241
+ # The ISO PDF specification differs in respect to the supported date format. When converting
242
+ # to a date string, a format suitable for both is output.
243
+ #
244
+ # See: PDF1.7 s7.9.4, ADB1.7 3.8.3
245
+ def serialize_time(obj)
246
+ zone = obj.strftime("%z'")
247
+ if zone == "+0000'"
248
+ zone = ''
249
+ else
250
+ zone[3, 0] = "'"
251
+ end
252
+ serialize_string(obj.strftime("D:%Y%m%d%H%M%S#{zone}"))
253
+ end
254
+
255
+ # See: #serialize_time
256
+ def serialize_date(obj)
257
+ serialize_time(obj.to_time)
258
+ end
259
+
260
+ # See: #serialize_time
261
+ def serialize_datetime(obj)
262
+ serialize_time(obj.to_time)
263
+ end
264
+
265
+ private
266
+
267
+ # Uses #serialize_hexapdf_reference if it is an indirect object, otherwise just serializes
268
+ # the objects value.
269
+ def serialize_hexapdf_object(obj)
270
+ if obj.indirect? && obj != @object
271
+ serialize_hexapdf_reference(obj)
272
+ else
273
+ __serialize(obj.value)
274
+ end
275
+ end
276
+
277
+ # See: PDF1.7 s7.3.10
278
+ def serialize_hexapdf_reference(obj)
279
+ "#{obj.oid} #{obj.gen} R".freeze
280
+ end
281
+
282
+ # Serializes the streams dictionary and its stream.
283
+ #
284
+ # See: PDF1.7 s7.3.8
285
+ def serialize_hexapdf_stream(obj)
286
+ if !obj.indirect?
287
+ raise HexaPDF::Error, "Can't serialize PDF stream without object identifier"
288
+ elsif obj != @object
289
+ return serialize_hexapdf_reference(obj)
290
+ end
291
+
292
+ fiber = if @encrypter
293
+ encrypter.encrypt_stream(obj)
294
+ else
295
+ obj.stream_encoder
296
+ end
297
+
298
+ if @io && fiber.respond_to?(:length) && fiber.length >= 0
299
+ obj.value[:Length] = fiber.length
300
+ @io << __serialize(obj.value)
301
+ @io << "stream\n".freeze
302
+ while fiber.alive? && (data = fiber.resume)
303
+ @io << data.freeze
304
+ end
305
+ @io << "\nendstream".freeze
306
+
307
+ nil
308
+ else
309
+ data = Filter.string_from_source(fiber)
310
+ obj.value[:Length] = data.size
311
+
312
+ str = __serialize(obj.value)
313
+ str << "stream\n".freeze
314
+ str << data
315
+ str << "\nendstream".freeze
316
+ end
317
+ end
318
+
319
+ # Invokes the correct serialization method for the object.
320
+ def __serialize(obj)
321
+ send(@dispatcher[obj.class], obj)
322
+ end
323
+
324
+ end
325
+
326
+ end
@@ -0,0 +1,279 @@
1
+ # -*- encoding: utf-8 -*-
2
+ #
3
+ #--
4
+ # This file is part of HexaPDF.
5
+ #
6
+ # HexaPDF - A Versatile PDF Creation and Manipulation Library For Ruby
7
+ # Copyright (C) 2016 Thomas Leitner
8
+ #
9
+ # HexaPDF is free software: you can redistribute it and/or modify it
10
+ # under the terms of the GNU Affero General Public License version 3 as
11
+ # published by the Free Software Foundation with the addition of the
12
+ # following permission added to Section 15 as permitted in Section 7(a):
13
+ # FOR ANY PART OF THE COVERED WORK IN WHICH THE COPYRIGHT IS OWNED BY
14
+ # THOMAS LEITNER, THOMAS LEITNER DISCLAIMS THE WARRANTY OF NON
15
+ # INFRINGEMENT OF THIRD PARTY RIGHTS.
16
+ #
17
+ # HexaPDF is distributed in the hope that it will be useful, but WITHOUT
18
+ # ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
19
+ # FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public
20
+ # License for more details.
21
+ #
22
+ # You should have received a copy of the GNU Affero General Public License
23
+ # along with HexaPDF. If not, see <http://www.gnu.org/licenses/>.
24
+ #
25
+ # The interactive user interfaces in modified source and object code
26
+ # versions of HexaPDF must display Appropriate Legal Notices, as required
27
+ # under Section 5 of the GNU Affero General Public License version 3.
28
+ #
29
+ # In accordance with Section 7(b) of the GNU Affero General Public
30
+ # License, a covered work must retain the producer line in every PDF that
31
+ # is created or manipulated using HexaPDF.
32
+ #++
33
+
34
+ require 'hexapdf/error'
35
+ require 'hexapdf/dictionary'
36
+ require 'hexapdf/filter'
37
+
38
+ module HexaPDF
39
+
40
+ # Container for stream data that is more complex than a string.
41
+ #
42
+ # This helper class wraps all information necessary to read stream data by using a Fiber object
43
+ # (see HexaPDF::Filter). The underlying data either comes from an IO object, a file represented by
44
+ # its file name or a Fiber defined via a Proc object.
45
+ #
46
+ # Additionally, the #filter and #decode_parms can be set to indicate that the data returned from
47
+ # the Fiber needs to be post-processed. The +filter+ and +decode_parms+ are automatically
48
+ # normalized to arrays on assignment to ease further processing.
49
+ class StreamData
50
+
51
+ # The filter(s) that need to be applied for getting the decoded stream data.
52
+ attr_reader :filter
53
+
54
+ # The decoding parameters associated with the +filter+(s).
55
+ attr_reader :decode_parms
56
+
57
+ # :call-seq:
58
+ # StreamData.new(io) -> stream_data
59
+ # StreamData.new(str) -> stream_data
60
+ # StreamData.new(proc) -> stream_data
61
+ # StreamData.new { block } -> stream_data
62
+ #
63
+ # Creates a new StreamData object for the given +source+ and with the given options.
64
+ #
65
+ # The +source+ can be:
66
+ #
67
+ # * An IO stream which is read starting from a specific +offset+ for a specific +length+
68
+ #
69
+ # * A string which is interpreted as a file name and read starting from a specific +offset+
70
+ # * and for a specific +length+
71
+ #
72
+ # * A Proc object (that is converted to a Fiber when needed) in which case the +offset+ and
73
+ # value is ignored. The Proc object can also be passed by using a block.
74
+ def initialize(source = nil, offset: nil, length: nil, filter: nil, decode_parms: nil, &block)
75
+ if source.nil? && !block_given?
76
+ raise ArgumentError, "Either a source object or a block must be given"
77
+ end
78
+ @source = source || block
79
+ @offset = offset
80
+ @length = length
81
+ @filter = [filter].flatten.compact
82
+ @decode_parms = [decode_parms].flatten
83
+ freeze
84
+ end
85
+
86
+ # Returns a Fiber for getting at the data of the stream represented by this object.
87
+ def fiber(chunk_size = 0)
88
+ if @source.kind_of?(Proc)
89
+ FiberWithLength.new(@length, &@source)
90
+ elsif @source.kind_of?(String)
91
+ HexaPDF::Filter.source_from_file(@source, pos: @offset || 0, length: @length || -1,
92
+ chunk_size: chunk_size)
93
+ else
94
+ HexaPDF::Filter.source_from_io(@source, pos: @offset || 0, length: @length || -1,
95
+ chunk_size: chunk_size)
96
+ end
97
+ end
98
+
99
+ end
100
+
101
+ # Implements Stream objects of the PDF object system.
102
+ #
103
+ # == Stream Objects
104
+ #
105
+ # A stream may also be associated with a PDF object but only if the value is a PDF dictionary.
106
+ # This associated dictionary further describes the stream, like its length or how it is encoded.
107
+ #
108
+ # Such a stream object in PDF contains string data but of possibly unlimited length. Therefore
109
+ # it is used for large amounts of data like images, page descriptions or embedded files.
110
+ #
111
+ # The basic Object class cannot hold stream data, only this subclass contains the necessary
112
+ # methods to conveniently work with the stream data!
113
+ #
114
+ # See: PDF1.7 s7.3.8, Dictionary
115
+ class Stream < Dictionary
116
+
117
+ define_field :Length, type: Integer # not required, will be auto-filled when writing
118
+ define_field :Filter, type: [Symbol, Array]
119
+ define_field :DecodeParms, type: [Dictionary, Hash, Array]
120
+ define_field :F, type: :FileSpec, version: '1.2'
121
+ define_field :FFilter, type: [Symbol, Array], version: '1.2'
122
+ define_field :FDecodeParms, type: [Dictionary, Hash, Array], version: '1.2'
123
+ define_field :DL, type: Integer
124
+
125
+ # Stream objects must always be indirect.
126
+ def must_be_indirect?
127
+ true
128
+ end
129
+
130
+ # Assigns a new stream data object.
131
+ #
132
+ # The +stream+ argument can be a HexaPDF::StreamData object, a String object or +nil+.
133
+ #
134
+ # If +stream+ is +nil+, an empty binary string is used instead.
135
+ def stream=(stream)
136
+ data.stream = stream
137
+ after_data_change
138
+ end
139
+
140
+ # Returns the (possibly decoded) stream data as string.
141
+ #
142
+ # Note that modifications done to the returned string are not reflected in the Stream object
143
+ # itself. The modified string must explicitly be assigned via #stream= to take effect.
144
+ def stream
145
+ if data.stream.kind_of?(String)
146
+ data.stream.dup
147
+ else
148
+ HexaPDF::Filter.string_from_source(stream_decoder)
149
+ end
150
+ end
151
+
152
+ # Returns the raw stream object.
153
+ #
154
+ # The returned value can be of many different types (see #stream=). For working with the
155
+ # decoded stream contents use #stream.
156
+ def raw_stream
157
+ data.stream
158
+ end
159
+
160
+ # Returns the Fiber representing the unprocessed content of the stream.
161
+ def stream_source
162
+ if data.stream.kind_of?(String)
163
+ HexaPDF::Filter.source_from_string(data.stream)
164
+ else
165
+ data.stream.fiber(config['io.chunk_size'.freeze])
166
+ end
167
+ end
168
+
169
+ # Returns the decoder Fiber for the stream data.
170
+ #
171
+ # See the Filter module for more information on how to work with the fiber.
172
+ def stream_decoder
173
+ source = stream_source
174
+
175
+ if data.stream.kind_of?(StreamData)
176
+ data.stream.filter.zip(data.stream.decode_parms) do |filter, decode_parms|
177
+ source = filter_for_name(filter).decoder(source, decode_parms)
178
+ end
179
+ end
180
+
181
+ source
182
+ end
183
+
184
+ # Returns the encoder Fiber for the stream data.
185
+ #
186
+ # The two arguments can be used to add additional filters for *only* this returned encoder
187
+ # Fiber. They should normally *not* be used and are here for use by the encryption facilities.
188
+ #
189
+ # See the Filter module for more information on how to work with the fiber.
190
+ def stream_encoder(additional_filter = nil, additional_decode_parms = nil)
191
+ encoder_data = [additional_filter, document.unwrap(self[:Filter])].flatten.
192
+ zip([additional_decode_parms, document.unwrap(self[:DecodeParms])].flatten).
193
+ delete_if {|f, _| f.nil?}
194
+ source = stream_source
195
+
196
+ if data.stream.kind_of?(StreamData)
197
+ decoder_data = data.stream.filter.zip(data.stream.decode_parms)
198
+
199
+ while !decoder_data.empty? && !encoder_data.empty? && decoder_data.last == encoder_data.last
200
+ decoder_data.pop
201
+ encoder_data.pop
202
+ end
203
+
204
+ decoder_data.each do |filter, decode_parms|
205
+ source = filter_for_name(filter).decoder(source, decode_parms)
206
+ end
207
+ end
208
+
209
+ encoder_data.reverse!.each do |filter, decode_parms|
210
+ source = filter_for_name(filter).encoder(source, decode_parms)
211
+ end
212
+
213
+ source
214
+ end
215
+
216
+ # Sets the filters that should be used for encoding the stream.
217
+ #
218
+ # The arguments +filter+ as well as +decode_parms+ can either be a single items or arrays.
219
+ #
220
+ # The filters have to be specified in the *decoding order*! For example, if the filters would
221
+ # be [:A85, :Fl], the stream would first be encoded with the Flate and then with the ASCII85
222
+ # filter.
223
+ def set_filter(filter, decode_parms = nil)
224
+ if filter.nil? || (filter.kind_of?(Array) && filter.empty?)
225
+ delete(:Filter)
226
+ else
227
+ self[:Filter] = filter
228
+ end
229
+ if decode_parms.nil? || (decode_parms.kind_of?(Array) && decode_parms.empty?) ||
230
+ !key?(:Filter)
231
+ delete(:DecodeParms)
232
+ else
233
+ self[:DecodeParms] = decode_parms
234
+ end
235
+ end
236
+
237
+ private
238
+
239
+ # Makes sure that the stream data is either a String or a HexaPDF::StreamData object.
240
+ def after_data_change
241
+ super
242
+ data.stream ||= ''.b
243
+ unless data.stream.kind_of?(StreamData) || data.stream.kind_of?(String)
244
+ raise ArgumentError, "Object of class #{data.stream.class} cannot be used as stream value"
245
+ end
246
+ end
247
+
248
+ # Returns the filter object that corresponds to the given filter name.
249
+ #
250
+ # See: HexaPDF::Filter
251
+ def filter_for_name(filter_name)
252
+ GlobalConfiguration.constantize('filter.map', filter_name) do
253
+ raise HexaPDF::Error, "Unknown stream filter '#{filter_name}' encountered"
254
+ end
255
+ end
256
+
257
+ # :nodoc:
258
+ # A mapping from short name to long name for filters.
259
+ FILTER_MAP = {AHx: :ASCIIHexDecode, A85: :ASCII85Decode, LZW: :LZWDecode,
260
+ Fl: :FlateDecode, RL: :RunLengthDecode, CCF: :CCITTFaxDecode, DCT: :DCTDecode}
261
+
262
+ # Validates the /Filter entry so that it contains only long-name filter names.
263
+ def perform_validation
264
+ super
265
+ if value[:Filter].kind_of?(Symbol) && FILTER_MAP.key?(value[:Filter])
266
+ yield("A stream's /Filter entry may only use long-form filter names", true)
267
+ value[:Filter] = FILTER_MAP[value[:Filter]]
268
+ elsif value[:Filter].kind_of?(Array)
269
+ value[:Filter].map! do |filter|
270
+ next filter unless FILTER_MAP.key?(filter)
271
+ yield("A stream's /Filter entry may only use long-form filter names", true)
272
+ FILTER_MAP[filter]
273
+ end
274
+ end
275
+ end
276
+
277
+ end
278
+
279
+ end