hexapdf 0.1.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (346) hide show
  1. checksums.yaml +7 -0
  2. data/CONTRIBUTERS +3 -0
  3. data/LICENSE +26 -0
  4. data/README.md +88 -0
  5. data/Rakefile +121 -0
  6. data/VERSION +1 -0
  7. data/agpl-3.0.txt +661 -0
  8. data/bin/hexapdf +6 -0
  9. data/data/hexapdf/afm/Courier-Bold.afm +342 -0
  10. data/data/hexapdf/afm/Courier-BoldOblique.afm +342 -0
  11. data/data/hexapdf/afm/Courier-Oblique.afm +342 -0
  12. data/data/hexapdf/afm/Courier.afm +342 -0
  13. data/data/hexapdf/afm/Helvetica-Bold.afm +2827 -0
  14. data/data/hexapdf/afm/Helvetica-BoldOblique.afm +2827 -0
  15. data/data/hexapdf/afm/Helvetica-Oblique.afm +3051 -0
  16. data/data/hexapdf/afm/Helvetica.afm +3051 -0
  17. data/data/hexapdf/afm/MustRead.html +1 -0
  18. data/data/hexapdf/afm/Symbol.afm +213 -0
  19. data/data/hexapdf/afm/Times-Bold.afm +2588 -0
  20. data/data/hexapdf/afm/Times-BoldItalic.afm +2384 -0
  21. data/data/hexapdf/afm/Times-Italic.afm +2667 -0
  22. data/data/hexapdf/afm/Times-Roman.afm +2419 -0
  23. data/data/hexapdf/afm/ZapfDingbats.afm +225 -0
  24. data/data/hexapdf/encoding/glyphlist.txt +4305 -0
  25. data/data/hexapdf/encoding/zapfdingbats.txt +225 -0
  26. data/examples/arc.rb +50 -0
  27. data/examples/graphics.rb +274 -0
  28. data/examples/hello_world.rb +16 -0
  29. data/examples/machupicchu.jpg +0 -0
  30. data/examples/merging.rb +24 -0
  31. data/examples/optimizing.rb +20 -0
  32. data/examples/show_char_bboxes.rb +55 -0
  33. data/examples/standard_pdf_fonts.rb +72 -0
  34. data/examples/truetype.rb +45 -0
  35. data/lib/hexapdf/cli/extract.rb +128 -0
  36. data/lib/hexapdf/cli/info.rb +121 -0
  37. data/lib/hexapdf/cli/inspect.rb +157 -0
  38. data/lib/hexapdf/cli/modify.rb +218 -0
  39. data/lib/hexapdf/cli.rb +121 -0
  40. data/lib/hexapdf/configuration.rb +392 -0
  41. data/lib/hexapdf/content/canvas.rb +1974 -0
  42. data/lib/hexapdf/content/color_space.rb +364 -0
  43. data/lib/hexapdf/content/graphic_object/arc.rb +267 -0
  44. data/lib/hexapdf/content/graphic_object/endpoint_arc.rb +208 -0
  45. data/lib/hexapdf/content/graphic_object/solid_arc.rb +173 -0
  46. data/lib/hexapdf/content/graphic_object.rb +81 -0
  47. data/lib/hexapdf/content/graphics_state.rb +579 -0
  48. data/lib/hexapdf/content/operator.rb +1072 -0
  49. data/lib/hexapdf/content/parser.rb +204 -0
  50. data/lib/hexapdf/content/processor.rb +451 -0
  51. data/lib/hexapdf/content/transformation_matrix.rb +172 -0
  52. data/lib/hexapdf/content.rb +47 -0
  53. data/lib/hexapdf/data_dir.rb +51 -0
  54. data/lib/hexapdf/dictionary.rb +303 -0
  55. data/lib/hexapdf/dictionary_fields.rb +382 -0
  56. data/lib/hexapdf/document.rb +589 -0
  57. data/lib/hexapdf/document_utils.rb +209 -0
  58. data/lib/hexapdf/encryption/aes.rb +206 -0
  59. data/lib/hexapdf/encryption/arc4.rb +93 -0
  60. data/lib/hexapdf/encryption/fast_aes.rb +79 -0
  61. data/lib/hexapdf/encryption/fast_arc4.rb +67 -0
  62. data/lib/hexapdf/encryption/identity.rb +63 -0
  63. data/lib/hexapdf/encryption/ruby_aes.rb +447 -0
  64. data/lib/hexapdf/encryption/ruby_arc4.rb +96 -0
  65. data/lib/hexapdf/encryption/security_handler.rb +494 -0
  66. data/lib/hexapdf/encryption/standard_security_handler.rb +616 -0
  67. data/lib/hexapdf/encryption.rb +94 -0
  68. data/lib/hexapdf/error.rb +73 -0
  69. data/lib/hexapdf/filter/ascii85_decode.rb +160 -0
  70. data/lib/hexapdf/filter/ascii_hex_decode.rb +87 -0
  71. data/lib/hexapdf/filter/dct_decode.rb +57 -0
  72. data/lib/hexapdf/filter/encryption.rb +59 -0
  73. data/lib/hexapdf/filter/flate_decode.rb +93 -0
  74. data/lib/hexapdf/filter/jpx_decode.rb +56 -0
  75. data/lib/hexapdf/filter/lzw_decode.rb +191 -0
  76. data/lib/hexapdf/filter/predictor.rb +266 -0
  77. data/lib/hexapdf/filter/run_length_decode.rb +108 -0
  78. data/lib/hexapdf/filter.rb +176 -0
  79. data/lib/hexapdf/font/cmap/parser.rb +146 -0
  80. data/lib/hexapdf/font/cmap/writer.rb +176 -0
  81. data/lib/hexapdf/font/cmap.rb +90 -0
  82. data/lib/hexapdf/font/encoding/base.rb +77 -0
  83. data/lib/hexapdf/font/encoding/difference_encoding.rb +64 -0
  84. data/lib/hexapdf/font/encoding/glyph_list.rb +150 -0
  85. data/lib/hexapdf/font/encoding/mac_expert_encoding.rb +221 -0
  86. data/lib/hexapdf/font/encoding/mac_roman_encoding.rb +265 -0
  87. data/lib/hexapdf/font/encoding/standard_encoding.rb +205 -0
  88. data/lib/hexapdf/font/encoding/symbol_encoding.rb +244 -0
  89. data/lib/hexapdf/font/encoding/win_ansi_encoding.rb +280 -0
  90. data/lib/hexapdf/font/encoding/zapf_dingbats_encoding.rb +250 -0
  91. data/lib/hexapdf/font/encoding.rb +68 -0
  92. data/lib/hexapdf/font/true_type/font.rb +179 -0
  93. data/lib/hexapdf/font/true_type/table/cmap.rb +103 -0
  94. data/lib/hexapdf/font/true_type/table/cmap_subtable.rb +384 -0
  95. data/lib/hexapdf/font/true_type/table/directory.rb +92 -0
  96. data/lib/hexapdf/font/true_type/table/glyf.rb +166 -0
  97. data/lib/hexapdf/font/true_type/table/head.rb +143 -0
  98. data/lib/hexapdf/font/true_type/table/hhea.rb +109 -0
  99. data/lib/hexapdf/font/true_type/table/hmtx.rb +79 -0
  100. data/lib/hexapdf/font/true_type/table/loca.rb +79 -0
  101. data/lib/hexapdf/font/true_type/table/maxp.rb +112 -0
  102. data/lib/hexapdf/font/true_type/table/name.rb +218 -0
  103. data/lib/hexapdf/font/true_type/table/os2.rb +200 -0
  104. data/lib/hexapdf/font/true_type/table/post.rb +230 -0
  105. data/lib/hexapdf/font/true_type/table.rb +155 -0
  106. data/lib/hexapdf/font/true_type.rb +48 -0
  107. data/lib/hexapdf/font/true_type_wrapper.rb +240 -0
  108. data/lib/hexapdf/font/type1/afm_parser.rb +230 -0
  109. data/lib/hexapdf/font/type1/character_metrics.rb +67 -0
  110. data/lib/hexapdf/font/type1/font.rb +123 -0
  111. data/lib/hexapdf/font/type1/font_metrics.rb +117 -0
  112. data/lib/hexapdf/font/type1/pfb_parser.rb +71 -0
  113. data/lib/hexapdf/font/type1.rb +52 -0
  114. data/lib/hexapdf/font/type1_wrapper.rb +193 -0
  115. data/lib/hexapdf/font_loader/from_configuration.rb +70 -0
  116. data/lib/hexapdf/font_loader/standard14.rb +98 -0
  117. data/lib/hexapdf/font_loader.rb +85 -0
  118. data/lib/hexapdf/font_utils.rb +89 -0
  119. data/lib/hexapdf/image_loader/jpeg.rb +166 -0
  120. data/lib/hexapdf/image_loader/pdf.rb +89 -0
  121. data/lib/hexapdf/image_loader/png.rb +410 -0
  122. data/lib/hexapdf/image_loader.rb +68 -0
  123. data/lib/hexapdf/importer.rb +139 -0
  124. data/lib/hexapdf/name_tree_node.rb +78 -0
  125. data/lib/hexapdf/number_tree_node.rb +67 -0
  126. data/lib/hexapdf/object.rb +363 -0
  127. data/lib/hexapdf/parser.rb +349 -0
  128. data/lib/hexapdf/rectangle.rb +99 -0
  129. data/lib/hexapdf/reference.rb +98 -0
  130. data/lib/hexapdf/revision.rb +206 -0
  131. data/lib/hexapdf/revisions.rb +194 -0
  132. data/lib/hexapdf/serializer.rb +326 -0
  133. data/lib/hexapdf/stream.rb +279 -0
  134. data/lib/hexapdf/task/dereference.rb +109 -0
  135. data/lib/hexapdf/task/optimize.rb +230 -0
  136. data/lib/hexapdf/task.rb +68 -0
  137. data/lib/hexapdf/tokenizer.rb +406 -0
  138. data/lib/hexapdf/type/catalog.rb +107 -0
  139. data/lib/hexapdf/type/embedded_file.rb +87 -0
  140. data/lib/hexapdf/type/file_specification.rb +232 -0
  141. data/lib/hexapdf/type/font.rb +81 -0
  142. data/lib/hexapdf/type/font_descriptor.rb +109 -0
  143. data/lib/hexapdf/type/font_simple.rb +190 -0
  144. data/lib/hexapdf/type/font_true_type.rb +47 -0
  145. data/lib/hexapdf/type/font_type1.rb +162 -0
  146. data/lib/hexapdf/type/form.rb +103 -0
  147. data/lib/hexapdf/type/graphics_state_parameter.rb +79 -0
  148. data/lib/hexapdf/type/image.rb +73 -0
  149. data/lib/hexapdf/type/info.rb +70 -0
  150. data/lib/hexapdf/type/names.rb +69 -0
  151. data/lib/hexapdf/type/object_stream.rb +224 -0
  152. data/lib/hexapdf/type/page.rb +355 -0
  153. data/lib/hexapdf/type/page_tree_node.rb +269 -0
  154. data/lib/hexapdf/type/resources.rb +212 -0
  155. data/lib/hexapdf/type/trailer.rb +128 -0
  156. data/lib/hexapdf/type/viewer_preferences.rb +73 -0
  157. data/lib/hexapdf/type/xref_stream.rb +204 -0
  158. data/lib/hexapdf/type.rb +67 -0
  159. data/lib/hexapdf/utils/bit_field.rb +87 -0
  160. data/lib/hexapdf/utils/bit_stream.rb +148 -0
  161. data/lib/hexapdf/utils/lru_cache.rb +65 -0
  162. data/lib/hexapdf/utils/math_helpers.rb +55 -0
  163. data/lib/hexapdf/utils/object_hash.rb +130 -0
  164. data/lib/hexapdf/utils/pdf_doc_encoding.rb +93 -0
  165. data/lib/hexapdf/utils/sorted_tree_node.rb +339 -0
  166. data/lib/hexapdf/version.rb +39 -0
  167. data/lib/hexapdf/writer.rb +199 -0
  168. data/lib/hexapdf/xref_section.rb +152 -0
  169. data/lib/hexapdf.rb +34 -0
  170. data/man/man1/hexapdf.1 +249 -0
  171. data/test/data/aes-test-vectors/CBCGFSbox-128-decrypt.data.gz +0 -0
  172. data/test/data/aes-test-vectors/CBCGFSbox-128-encrypt.data.gz +0 -0
  173. data/test/data/aes-test-vectors/CBCGFSbox-192-decrypt.data.gz +0 -0
  174. data/test/data/aes-test-vectors/CBCGFSbox-192-encrypt.data.gz +0 -0
  175. data/test/data/aes-test-vectors/CBCGFSbox-256-decrypt.data.gz +0 -0
  176. data/test/data/aes-test-vectors/CBCGFSbox-256-encrypt.data.gz +0 -0
  177. data/test/data/aes-test-vectors/CBCKeySbox-128-decrypt.data.gz +0 -0
  178. data/test/data/aes-test-vectors/CBCKeySbox-128-encrypt.data.gz +0 -0
  179. data/test/data/aes-test-vectors/CBCKeySbox-192-decrypt.data.gz +0 -0
  180. data/test/data/aes-test-vectors/CBCKeySbox-192-encrypt.data.gz +0 -0
  181. data/test/data/aes-test-vectors/CBCKeySbox-256-decrypt.data.gz +0 -0
  182. data/test/data/aes-test-vectors/CBCKeySbox-256-encrypt.data.gz +0 -0
  183. data/test/data/aes-test-vectors/CBCVarKey-128-decrypt.data.gz +0 -0
  184. data/test/data/aes-test-vectors/CBCVarKey-128-encrypt.data.gz +0 -0
  185. data/test/data/aes-test-vectors/CBCVarKey-192-decrypt.data.gz +0 -0
  186. data/test/data/aes-test-vectors/CBCVarKey-192-encrypt.data.gz +0 -0
  187. data/test/data/aes-test-vectors/CBCVarKey-256-decrypt.data.gz +0 -0
  188. data/test/data/aes-test-vectors/CBCVarKey-256-encrypt.data.gz +0 -0
  189. data/test/data/aes-test-vectors/CBCVarTxt-128-decrypt.data.gz +0 -0
  190. data/test/data/aes-test-vectors/CBCVarTxt-128-encrypt.data.gz +0 -0
  191. data/test/data/aes-test-vectors/CBCVarTxt-192-decrypt.data.gz +0 -0
  192. data/test/data/aes-test-vectors/CBCVarTxt-192-encrypt.data.gz +0 -0
  193. data/test/data/aes-test-vectors/CBCVarTxt-256-decrypt.data.gz +0 -0
  194. data/test/data/aes-test-vectors/CBCVarTxt-256-encrypt.data.gz +0 -0
  195. data/test/data/fonts/Ubuntu-Title.ttf +0 -0
  196. data/test/data/images/cmyk.jpg +0 -0
  197. data/test/data/images/fillbytes.jpg +0 -0
  198. data/test/data/images/gray.jpg +0 -0
  199. data/test/data/images/greyscale-1bit.png +0 -0
  200. data/test/data/images/greyscale-2bit.png +0 -0
  201. data/test/data/images/greyscale-4bit.png +0 -0
  202. data/test/data/images/greyscale-8bit.png +0 -0
  203. data/test/data/images/greyscale-alpha-8bit.png +0 -0
  204. data/test/data/images/greyscale-trns-8bit.png +0 -0
  205. data/test/data/images/greyscale-with-gamma1.0.png +0 -0
  206. data/test/data/images/greyscale-with-gamma1.5.png +0 -0
  207. data/test/data/images/indexed-1bit.png +0 -0
  208. data/test/data/images/indexed-2bit.png +0 -0
  209. data/test/data/images/indexed-4bit.png +0 -0
  210. data/test/data/images/indexed-8bit.png +0 -0
  211. data/test/data/images/indexed-alpha-4bit.png +0 -0
  212. data/test/data/images/indexed-alpha-8bit.png +0 -0
  213. data/test/data/images/rgb.jpg +0 -0
  214. data/test/data/images/truecolour-8bit.png +0 -0
  215. data/test/data/images/truecolour-alpha-8bit.png +0 -0
  216. data/test/data/images/truecolour-gama-chrm-8bit.png +0 -0
  217. data/test/data/images/truecolour-srgb-8bit.png +0 -0
  218. data/test/data/minimal.pdf +44 -0
  219. data/test/data/standard-security-handler/README +9 -0
  220. data/test/data/standard-security-handler/bothpwd-aes-128bit-V4.pdf +44 -0
  221. data/test/data/standard-security-handler/bothpwd-aes-256bit-V5.pdf +0 -0
  222. data/test/data/standard-security-handler/bothpwd-arc4-128bit-V2.pdf +43 -0
  223. data/test/data/standard-security-handler/bothpwd-arc4-128bit-V4.pdf +43 -0
  224. data/test/data/standard-security-handler/bothpwd-arc4-40bit-V1.pdf +0 -0
  225. data/test/data/standard-security-handler/nopwd-aes-128bit-V4.pdf +43 -0
  226. data/test/data/standard-security-handler/nopwd-aes-256bit-V5.pdf +0 -0
  227. data/test/data/standard-security-handler/nopwd-arc4-128bit-V2.pdf +43 -0
  228. data/test/data/standard-security-handler/nopwd-arc4-128bit-V4.pdf +43 -0
  229. data/test/data/standard-security-handler/nopwd-arc4-40bit-V1.pdf +43 -0
  230. data/test/data/standard-security-handler/ownerpwd-aes-128bit-V4.pdf +0 -0
  231. data/test/data/standard-security-handler/ownerpwd-aes-256bit-V5.pdf +43 -0
  232. data/test/data/standard-security-handler/ownerpwd-arc4-128bit-V2.pdf +43 -0
  233. data/test/data/standard-security-handler/ownerpwd-arc4-128bit-V4.pdf +43 -0
  234. data/test/data/standard-security-handler/ownerpwd-arc4-40bit-V1.pdf +43 -0
  235. data/test/data/standard-security-handler/userpwd-aes-128bit-V4.pdf +43 -0
  236. data/test/data/standard-security-handler/userpwd-aes-256bit-V5.pdf +43 -0
  237. data/test/data/standard-security-handler/userpwd-arc4-128bit-V2.pdf +0 -0
  238. data/test/data/standard-security-handler/userpwd-arc4-128bit-V4.pdf +0 -0
  239. data/test/data/standard-security-handler/userpwd-arc4-40bit-V1.pdf +43 -0
  240. data/test/hexapdf/common_tokenizer_tests.rb +204 -0
  241. data/test/hexapdf/content/common.rb +31 -0
  242. data/test/hexapdf/content/graphic_object/test_arc.rb +93 -0
  243. data/test/hexapdf/content/graphic_object/test_endpoint_arc.rb +91 -0
  244. data/test/hexapdf/content/graphic_object/test_solid_arc.rb +86 -0
  245. data/test/hexapdf/content/test_canvas.rb +1113 -0
  246. data/test/hexapdf/content/test_color_space.rb +97 -0
  247. data/test/hexapdf/content/test_graphics_state.rb +138 -0
  248. data/test/hexapdf/content/test_operator.rb +619 -0
  249. data/test/hexapdf/content/test_parser.rb +66 -0
  250. data/test/hexapdf/content/test_processor.rb +156 -0
  251. data/test/hexapdf/content/test_transformation_matrix.rb +64 -0
  252. data/test/hexapdf/encryption/common.rb +87 -0
  253. data/test/hexapdf/encryption/test_aes.rb +121 -0
  254. data/test/hexapdf/encryption/test_arc4.rb +39 -0
  255. data/test/hexapdf/encryption/test_fast_aes.rb +17 -0
  256. data/test/hexapdf/encryption/test_fast_arc4.rb +12 -0
  257. data/test/hexapdf/encryption/test_identity.rb +21 -0
  258. data/test/hexapdf/encryption/test_ruby_aes.rb +23 -0
  259. data/test/hexapdf/encryption/test_ruby_arc4.rb +20 -0
  260. data/test/hexapdf/encryption/test_security_handler.rb +356 -0
  261. data/test/hexapdf/encryption/test_standard_security_handler.rb +274 -0
  262. data/test/hexapdf/filter/common.rb +53 -0
  263. data/test/hexapdf/filter/test_ascii85_decode.rb +60 -0
  264. data/test/hexapdf/filter/test_ascii_hex_decode.rb +33 -0
  265. data/test/hexapdf/filter/test_encryption.rb +24 -0
  266. data/test/hexapdf/filter/test_flate_decode.rb +35 -0
  267. data/test/hexapdf/filter/test_lzw_decode.rb +52 -0
  268. data/test/hexapdf/filter/test_predictor.rb +183 -0
  269. data/test/hexapdf/filter/test_run_length_decode.rb +32 -0
  270. data/test/hexapdf/font/cmap/test_parser.rb +67 -0
  271. data/test/hexapdf/font/cmap/test_writer.rb +58 -0
  272. data/test/hexapdf/font/encoding/test_base.rb +35 -0
  273. data/test/hexapdf/font/encoding/test_difference_encoding.rb +21 -0
  274. data/test/hexapdf/font/encoding/test_glyph_list.rb +59 -0
  275. data/test/hexapdf/font/encoding/test_zapf_dingbats_encoding.rb +16 -0
  276. data/test/hexapdf/font/test_encoding.rb +27 -0
  277. data/test/hexapdf/font/test_true_type_wrapper.rb +110 -0
  278. data/test/hexapdf/font/test_type1_wrapper.rb +66 -0
  279. data/test/hexapdf/font/true_type/common.rb +19 -0
  280. data/test/hexapdf/font/true_type/table/test_cmap.rb +59 -0
  281. data/test/hexapdf/font/true_type/table/test_cmap_subtable.rb +133 -0
  282. data/test/hexapdf/font/true_type/table/test_directory.rb +35 -0
  283. data/test/hexapdf/font/true_type/table/test_glyf.rb +58 -0
  284. data/test/hexapdf/font/true_type/table/test_head.rb +76 -0
  285. data/test/hexapdf/font/true_type/table/test_hhea.rb +40 -0
  286. data/test/hexapdf/font/true_type/table/test_hmtx.rb +38 -0
  287. data/test/hexapdf/font/true_type/table/test_loca.rb +43 -0
  288. data/test/hexapdf/font/true_type/table/test_maxp.rb +62 -0
  289. data/test/hexapdf/font/true_type/table/test_name.rb +95 -0
  290. data/test/hexapdf/font/true_type/table/test_os2.rb +65 -0
  291. data/test/hexapdf/font/true_type/table/test_post.rb +89 -0
  292. data/test/hexapdf/font/true_type/test_font.rb +120 -0
  293. data/test/hexapdf/font/true_type/test_table.rb +41 -0
  294. data/test/hexapdf/font/type1/test_afm_parser.rb +51 -0
  295. data/test/hexapdf/font/type1/test_font.rb +68 -0
  296. data/test/hexapdf/font/type1/test_pfb_parser.rb +37 -0
  297. data/test/hexapdf/font_loader/test_from_configuration.rb +28 -0
  298. data/test/hexapdf/font_loader/test_standard14.rb +22 -0
  299. data/test/hexapdf/image_loader/test_jpeg.rb +83 -0
  300. data/test/hexapdf/image_loader/test_pdf.rb +47 -0
  301. data/test/hexapdf/image_loader/test_png.rb +258 -0
  302. data/test/hexapdf/task/test_dereference.rb +46 -0
  303. data/test/hexapdf/task/test_optimize.rb +137 -0
  304. data/test/hexapdf/test_configuration.rb +82 -0
  305. data/test/hexapdf/test_data_dir.rb +32 -0
  306. data/test/hexapdf/test_dictionary.rb +284 -0
  307. data/test/hexapdf/test_dictionary_fields.rb +185 -0
  308. data/test/hexapdf/test_document.rb +574 -0
  309. data/test/hexapdf/test_document_utils.rb +144 -0
  310. data/test/hexapdf/test_filter.rb +96 -0
  311. data/test/hexapdf/test_font_utils.rb +47 -0
  312. data/test/hexapdf/test_importer.rb +78 -0
  313. data/test/hexapdf/test_object.rb +177 -0
  314. data/test/hexapdf/test_parser.rb +394 -0
  315. data/test/hexapdf/test_rectangle.rb +36 -0
  316. data/test/hexapdf/test_reference.rb +41 -0
  317. data/test/hexapdf/test_revision.rb +139 -0
  318. data/test/hexapdf/test_revisions.rb +93 -0
  319. data/test/hexapdf/test_serializer.rb +169 -0
  320. data/test/hexapdf/test_stream.rb +262 -0
  321. data/test/hexapdf/test_tokenizer.rb +30 -0
  322. data/test/hexapdf/test_writer.rb +120 -0
  323. data/test/hexapdf/test_xref_section.rb +35 -0
  324. data/test/hexapdf/type/test_catalog.rb +30 -0
  325. data/test/hexapdf/type/test_embedded_file.rb +16 -0
  326. data/test/hexapdf/type/test_file_specification.rb +148 -0
  327. data/test/hexapdf/type/test_font.rb +35 -0
  328. data/test/hexapdf/type/test_font_descriptor.rb +51 -0
  329. data/test/hexapdf/type/test_font_simple.rb +190 -0
  330. data/test/hexapdf/type/test_font_type1.rb +128 -0
  331. data/test/hexapdf/type/test_form.rb +60 -0
  332. data/test/hexapdf/type/test_info.rb +14 -0
  333. data/test/hexapdf/type/test_names.rb +9 -0
  334. data/test/hexapdf/type/test_object_stream.rb +84 -0
  335. data/test/hexapdf/type/test_page.rb +260 -0
  336. data/test/hexapdf/type/test_page_tree_node.rb +255 -0
  337. data/test/hexapdf/type/test_resources.rb +167 -0
  338. data/test/hexapdf/type/test_trailer.rb +109 -0
  339. data/test/hexapdf/type/test_xref_stream.rb +131 -0
  340. data/test/hexapdf/utils/test_bit_field.rb +47 -0
  341. data/test/hexapdf/utils/test_lru_cache.rb +22 -0
  342. data/test/hexapdf/utils/test_object_hash.rb +115 -0
  343. data/test/hexapdf/utils/test_pdf_doc_encoding.rb +18 -0
  344. data/test/hexapdf/utils/test_sorted_tree_node.rb +232 -0
  345. data/test/test_helper.rb +56 -0
  346. metadata +427 -0
@@ -0,0 +1,392 @@
1
+ # -*- encoding: utf-8 -*-
2
+ #
3
+ #--
4
+ # This file is part of HexaPDF.
5
+ #
6
+ # HexaPDF - A Versatile PDF Creation and Manipulation Library For Ruby
7
+ # Copyright (C) 2016 Thomas Leitner
8
+ #
9
+ # HexaPDF is free software: you can redistribute it and/or modify it
10
+ # under the terms of the GNU Affero General Public License version 3 as
11
+ # published by the Free Software Foundation with the addition of the
12
+ # following permission added to Section 15 as permitted in Section 7(a):
13
+ # FOR ANY PART OF THE COVERED WORK IN WHICH THE COPYRIGHT IS OWNED BY
14
+ # THOMAS LEITNER, THOMAS LEITNER DISCLAIMS THE WARRANTY OF NON
15
+ # INFRINGEMENT OF THIRD PARTY RIGHTS.
16
+ #
17
+ # HexaPDF is distributed in the hope that it will be useful, but WITHOUT
18
+ # ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
19
+ # FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public
20
+ # License for more details.
21
+ #
22
+ # You should have received a copy of the GNU Affero General Public License
23
+ # along with HexaPDF. If not, see <http://www.gnu.org/licenses/>.
24
+ #
25
+ # The interactive user interfaces in modified source and object code
26
+ # versions of HexaPDF must display Appropriate Legal Notices, as required
27
+ # under Section 5 of the GNU Affero General Public License version 3.
28
+ #
29
+ # In accordance with Section 7(b) of the GNU Affero General Public
30
+ # License, a covered work must retain the producer line in every PDF that
31
+ # is created or manipulated using HexaPDF.
32
+ #++
33
+
34
+ require 'hexapdf/error'
35
+
36
+ module HexaPDF
37
+
38
+ # Manages both the global and document specific configuration options for HexaPDF.
39
+ #
40
+ # == Overview
41
+ #
42
+ # HexaPDF allows detailed control over many aspects of PDF manipulation. If there is a need to
43
+ # use a certain default value somewhere, it is defined as configuration options so that it can
44
+ # easily be changed.
45
+ #
46
+ # Some options are defined as global options because they are needed on the class level - see
47
+ # HexaPDF::GlobalConfiguration. Other options can be configured for individual documents as they
48
+ # allow to fine-tune some behavior - see HexaPDF::DefaultDocumentConfiguration.
49
+ #
50
+ # A configuration option name is dot-separted to provide a hierarchy of option names. For
51
+ # example, io.chunk_size.
52
+ class Configuration
53
+
54
+ # Creates a new document specific Configuration object by merging the values into the default
55
+ # configuration object.
56
+ def self.with_defaults(values = {})
57
+ DefaultDocumentConfiguration.merge(values)
58
+ end
59
+
60
+
61
+ # Creates a new Configuration object using the provided hash argument.
62
+ def initialize(options = {})
63
+ @options = options
64
+ end
65
+
66
+ # Returns +true+ if the given option exists.
67
+ def key?(name)
68
+ options.key?(name)
69
+ end
70
+ alias :option? :key?
71
+
72
+ # Returns the value for the configuration option +name+.
73
+ def [](name)
74
+ options[name]
75
+ end
76
+
77
+ # Uses +value+ as the value for the configuration option +name+.
78
+ def []=(name, value)
79
+ options[name] = value
80
+ end
81
+
82
+ # Returns a new Configuration object containing the options from the given configuration
83
+ # object (or hash) and this configuration object.
84
+ #
85
+ # If a key already has a value in this object, its value is overwritten by the one from
86
+ # +config+. However, hash values are merged instead of being overwritten.
87
+ def merge(config)
88
+ config = (config.kind_of?(self.class) ? config.options : config)
89
+ self.class.new(options.merge(config) do |_key, old, new|
90
+ old.kind_of?(Hash) && new.kind_of?(Hash) ? old.merge(new) : new
91
+ end)
92
+ end
93
+
94
+ # :call-seq:
95
+ # config.constantize(name, key = nil) -> constant or nil
96
+ # config.constantize(name, key = nil) {|name| block} -> obj
97
+ #
98
+ # Returns the constant the option +name+ is referring to. If +key+ is provided and the value
99
+ # of the option +name+ responds to \#[], the constant to which +key+ refers is returned.
100
+ #
101
+ # If no constant can be found and no block is provided, +nil+ is returned. If a block is
102
+ # provided it is called with the option name and its result will be returned.
103
+ #
104
+ # config.constantize('encryption.aes') #=> HexaPDF::Encryption::FastAES
105
+ # config.constantize('filter.map', :Fl) #=> HexaPDF::Filter::FlateDecode
106
+ def constantize(name, key = :__unset)
107
+ data = self[name]
108
+ data = data[key] if key != :__unset && data.respond_to?(:[])
109
+ (data = ::Object.const_get(data) rescue nil) if data.kind_of?(String)
110
+ data = yield(name) if block_given? && data.nil?
111
+ data
112
+ end
113
+
114
+ protected
115
+
116
+ # Returns the hash with the configuration options.
117
+ attr_reader :options
118
+
119
+ end
120
+
121
+ # The default document specific configuration object.
122
+ #
123
+ # Modify this object if you want to globally change document specific options or if you want to
124
+ # introduce new document specific options.
125
+ #
126
+ # The following options are provided:
127
+ #
128
+ # document.auto_decrypt::
129
+ # A boolean determining whether the document should be decrypted automatically when parsed.
130
+ #
131
+ # If this is set to +false+ and the PDF document should later be decrypted, the method
132
+ # Encryption::SecurityHandler.set_up_decryption(document, decryption_opts) has to be called to
133
+ # set and retrieve the needed security handler. Note, however, that already loaded indirect
134
+ # objects have to be decrypted manually!
135
+ #
136
+ # In nearly all cases this option should not be changed from its default setting!
137
+ #
138
+ # font.map::
139
+ # Defines a mapping from font names and variants to font files.
140
+ #
141
+ # The value needs to be a hash of the form:
142
+ # {"font_name": {variant: file_name, variant2: file_name2, ...}, ...}
143
+ #
144
+ # Once a font is registered in this way, the font name together with a variant name can be used
145
+ # with the HexaPDF::FontUtils#load method to load the font.
146
+ #
147
+ # For best compatibility, the following variant names should be used:
148
+ #
149
+ # [none] For the normal variant of the font
150
+ # [bold] For the bold variant of the font
151
+ # [italic] For the italic or oblique variant of the font
152
+ # [bold_italic] For the bold and italic/oblique variant of the font
153
+ #
154
+ # font.on_missing_glyph::
155
+ # Callback hook when an UTF-8 character cannot be mapped to a glyph of a font.
156
+ #
157
+ # The value needs to be an object that responds to \#call(code_or_name, font) where
158
+ # +code_or_name+ is the Unicode value or the glyph name for the missing glyph and returns a
159
+ # substitute glyph name/ID to be used instead.
160
+ #
161
+ # The default implementation raises an error.
162
+ #
163
+ # font_loader::
164
+ # An array with font loader implementations. When a font should be loaded, the array is
165
+ # iterated in sequence and the first valid font returned by a font loader is used.
166
+ #
167
+ # If a value is a String, it should contain the name of a constant that is a font loader
168
+ # object.
169
+ #
170
+ # See the HexaPDF::FontLoader module for information on how to implement a font loader object.
171
+ #
172
+ # graphic_object.map::
173
+ # A mapping from graphic object names to graphic object factories.
174
+ #
175
+ # See HexaPDF::Content::GraphicObject for more information.
176
+ #
177
+ # graphic_object.arc.max_curves::
178
+ # The maximum number of curves used for approximating a complete ellipse using Bezier curves.
179
+ #
180
+ # The default value is 6, higher values result in better approximations but also take longer
181
+ # to compute. It should not be set to values lower than 4, otherwise the approximation of a
182
+ # complete ellipse is visibly false.
183
+ #
184
+ # image_loader.pdf.use_stringio::
185
+ # A boolean determining whether images specified via file names should be read into memory
186
+ # all at once using a StringIO object.
187
+ #
188
+ # Since loading a PDF as image entails having the IO object from the image PDF around until
189
+ # the PDF document where it is used is written, there is the choice whether memory should be
190
+ # used to load the image PDF all at once or whether a File object is used that needs to be
191
+ # manually closed.
192
+ #
193
+ # To avoid leaking file descriptors, using the StringIO is the default setting. If you set
194
+ # this option to +false+, it is strongly advised to use ObjectSpace.each_object(File) (or
195
+ # +IO+ instead of +File) to traverse the list of open file descriptors and close the ones
196
+ # that have been used for PDF images.
197
+ #
198
+ # io.chunk_size::
199
+ # The size of the chunks that are used when reading IO data.
200
+ #
201
+ # This can be used to limit the memory needed for reading or writing PDF files with huge
202
+ # stream objects.
203
+ #
204
+ # page.default_media_box::
205
+ # The media box that is used for new pages that don't define a media box. Default value is
206
+ # A4. See HexaPDF::Type::Page::PAPER_SIZE for a list of predefined paper sizes.
207
+ #
208
+ # The value can either be a rectangle defining the paper size or a Symbol referencing one of
209
+ # the predefined paper sizes.
210
+ #
211
+ # parser.on_correctable_error::
212
+ # Callback hook when the parser encounters an error that can be corrected.
213
+ #
214
+ # The value needs to be an object that responds to \#call(document, message, position) and
215
+ # returns +true+ if an error should be raised.
216
+ #
217
+ # sorted_tree.max_leaf_node_size::
218
+ # The maximum number of nodes that should be in a leaf node of a node tree.
219
+ DefaultDocumentConfiguration =
220
+ Configuration.new('document.auto_decrypt' => true,
221
+ 'font.map' => {},
222
+ 'font.on_missing_glyph' => proc do |n, f|
223
+ raise HexaPDF::Error, "No glyph for '#{n}' in font #{f.font_name} found"
224
+ end,
225
+ 'font_loader' => [
226
+ 'HexaPDF::FontLoader::Standard14',
227
+ 'HexaPDF::FontLoader::FromConfiguration',
228
+ ],
229
+ 'graphic_object.map' => {
230
+ arc: 'HexaPDF::Content::GraphicObject::Arc',
231
+ endpoint_arc: 'HexaPDF::Content::GraphicObject::EndpointArc',
232
+ solid_arc: 'HexaPDF::Content::GraphicObject::SolidArc',
233
+ },
234
+ 'graphic_object.arc.max_curves' => 6,
235
+ 'image_loader.pdf.use_stringio' => true,
236
+ 'io.chunk_size' => 2**16,
237
+ 'page.default_media_box' => :A4,
238
+ 'parser.on_correctable_error' => proc { false },
239
+ 'sorted_tree.max_leaf_node_size' => 64)
240
+
241
+ # The global configuration object, providing the following options:
242
+ #
243
+ # color_space.map::
244
+ # A mapping from a PDF name (a Symbol) to a color space class (see
245
+ # HexaPDF::Content::ColorSpace). If the value is a String, it should contain the name of a
246
+ # constant that contains a color space class.
247
+ #
248
+ # Classes for the most often used color space families are implemented and readily available.
249
+ #
250
+ # See PDF1.7 s8.6
251
+ #
252
+ # encryption.aes::
253
+ # The class that should be used for AES encryption. If the value is a String, it should
254
+ # contain the name of a constant to such a class.
255
+ #
256
+ # See HexaPDF::Encryption::AES for the general interface such a class must conform to and
257
+ # HexaPDF::Encryption::RubyAES as well as HexaPDF::Encryption::FastAES for implementations.
258
+ #
259
+ # encryption.arc4::
260
+ # The class that should be used for ARC4 encryption. If the value is a String, it should
261
+ # contain the name of a constant to such a class.
262
+ #
263
+ # See HexaPDF::Encryption::ARC4 for the general interface such a class must conform to and
264
+ # HexaPDF::Encryption::RubyARC4 as well as HexaPDF::Encryption::FastARC4 for implementations.
265
+ #
266
+ # encryption.filter_map::
267
+ # A mapping from a PDF name (a Symbol) to a security handler class (see
268
+ # Encryption::SecurityHandler). If the value is a String, it should contain the name of a
269
+ # constant to such a class.
270
+ #
271
+ # PDF defines a standard security handler that is implemented
272
+ # (HexaPDF::Encryption::StandardSecurityHandler) and assigned the :Standard name.
273
+ #
274
+ # encryption.sub_filter_map::
275
+ # A mapping from a PDF name (a Symbol) to a security handler class (see
276
+ # HexaPDF::Encryption::SecurityHandler). If the value is a String, it should contain the name
277
+ # of a constant to such a class.
278
+ #
279
+ # The sub filter map is used when the security handler defined by the encryption dictionary
280
+ # is not available, but a compatible implementation is.
281
+ #
282
+ # filter.flate_compression::
283
+ # Specifies the compression level that should be used with the FlateDecode filter. The level
284
+ # can range from 0 (no compression), 1 (best speed) to 9 (best compression, default).
285
+ #
286
+ # filter.map::
287
+ # A mapping from a PDF name (a Symbol) to a filter object (see Filter). If the value is a
288
+ # String, it should contain the name of a constant that contains a filter object.
289
+ #
290
+ # The most often used filters are implemented and readily available.
291
+ #
292
+ # See PDF1.7 s7.4.1, ADB sH.3 3.3
293
+ #
294
+ # image_loader::
295
+ # An array with image loader implementations. When an image should be loaded, the array is
296
+ # iterated in sequence to find a suitable image loader.
297
+ #
298
+ # If a value is a String, it should contain the name of a constant that is an image loader
299
+ # object.
300
+ #
301
+ # See the HexaPDF::ImageLoader module for information on how to implement an image loader
302
+ # object.
303
+ #
304
+ # object.type_map::
305
+ # A mapping from a PDF name (a Symbol) to PDF object classes which is based on the /Type
306
+ # field. If the value is a String, it should contain the name of a constant that contains a
307
+ # PDF object class.
308
+ #
309
+ # This mapping is used to provide automatic wrapping of objects in the HexaPDF::Document#wrap
310
+ # method.
311
+ #
312
+ # object.subtype_map::
313
+ # A mapping from a PDF name (a Symbol) to PDF object classes which is based on the /Subtype
314
+ # field. If the value is a String, it should contain the name of a constant that contains a
315
+ # PDF object class.
316
+ #
317
+ # This mapping is used to provide automatic wrapping of objects in the HexaPDF::Document#wrap
318
+ # method.
319
+ #
320
+ # task.map::
321
+ # A mapping from task names to callable task objects. See HexaPDF::Task for more information.
322
+ GlobalConfiguration =
323
+ Configuration.new('encryption.aes' => 'HexaPDF::Encryption::FastAES',
324
+ 'encryption.arc4' => 'HexaPDF::Encryption::FastARC4',
325
+ 'encryption.filter_map' => {
326
+ Standard: 'HexaPDF::Encryption::StandardSecurityHandler',
327
+ },
328
+ 'encryption.sub_filter_map' => {
329
+ },
330
+ 'filter.flate_compression' => 9,
331
+ 'filter.map' => {
332
+ ASCIIHexDecode: 'HexaPDF::Filter::ASCIIHexDecode',
333
+ AHx: 'HexaPDF::Filter::ASCIIHexDecode',
334
+ ASCII85Decode: 'HexaPDF::Filter::ASCII85Decode',
335
+ A85: 'HexaPDF::Filter::ASCII85Decode',
336
+ LZWDecode: 'HexaPDF::Filter::LZWDecode',
337
+ LZW: 'HexaPDF::Filter::LZWDecode',
338
+ FlateDecode: 'HexaPDF::Filter::FlateDecode',
339
+ Fl: 'HexaPDF::Filter::FlateDecode',
340
+ RunLengthDecode: 'HexaPDF::Filter::RunLengthDecode',
341
+ RL: 'HexaPDF::Filter::RunLengthDecode',
342
+ CCITTFaxDecode: nil,
343
+ CCF: nil,
344
+ JBIG2Decode: nil,
345
+ DCTDecode: 'HexaPDF::Filter::DCTDecode',
346
+ DCT: 'HexaPDF::Filter::DCTDecode',
347
+ JPXDecode: 'HexaPDF::Filter::JPXDecode',
348
+ Crypt: nil,
349
+ Encryption: 'HexaPDF::Filter::Encryption',
350
+ },
351
+ 'color_space.map' => {
352
+ DeviceRGB: 'HexaPDF::Content::ColorSpace::DeviceRGB',
353
+ DeviceCMYK: 'HexaPDF::Content::ColorSpace::DeviceCMYK',
354
+ DeviceGray: 'HexaPDF::Content::ColorSpace::DeviceGray',
355
+ },
356
+ 'image_loader' => [
357
+ 'HexaPDF::ImageLoader::JPEG',
358
+ 'HexaPDF::ImageLoader::PNG',
359
+ 'HexaPDF::ImageLoader::PDF',
360
+ ],
361
+ 'object.type_map' => {
362
+ XRef: 'HexaPDF::Type::XRefStream',
363
+ ObjStm: 'HexaPDF::Type::ObjectStream',
364
+ Catalog: 'HexaPDF::Type::Catalog',
365
+ Pages: 'HexaPDF::Type::PageTreeNode',
366
+ Page: 'HexaPDF::Type::Page',
367
+ Filespec: 'HexaPDF::Type::FileSpecification',
368
+ EmbeddedFile: 'HexaPDF::Type::EmbeddedFile',
369
+ ExtGState: 'HexaPDF::Type::GraphicsStateParameter',
370
+ Font: 'HexaPDF::Type::Font',
371
+ FontDescriptor: 'HexaPDF::Type::FontDescriptor',
372
+ XXEmbeddedFileParameters: 'HexaPDF::Type::EmbeddedFile::Parameters',
373
+ XXEmbeddedFileParametersMacInfo: 'HexaPDF::Type::EmbeddedFile::MacInfo',
374
+ XXFilespecEFDictionary: 'HexaPDF::Type::FileSpecification::EFDictionary',
375
+ XXInfo: 'HexaPDF::Type::Info',
376
+ XXNames: 'HexaPDF::Type::Names',
377
+ XXResources: 'HexaPDF::Type::Resources',
378
+ XXTrailer: 'HexaPDF::Type::Trailer',
379
+ XXViewerPreferences: 'HexaPDF::Type::ViewerPreferences',
380
+ },
381
+ 'object.subtype_map' => {
382
+ Image: 'HexaPDF::Type::Image',
383
+ Form: 'HexaPDF::Type::Form',
384
+ Type1: 'HexaPDF::Type::FontType1',
385
+ TrueType: 'HexaPDF::Type::FontTrueType',
386
+ },
387
+ 'task.map' => {
388
+ optimize: 'HexaPDF::Task::Optimize',
389
+ dereference: 'HexaPDF::Task::Dereference',
390
+ })
391
+
392
+ end