hexapdf 0.1.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (346) hide show
  1. checksums.yaml +7 -0
  2. data/CONTRIBUTERS +3 -0
  3. data/LICENSE +26 -0
  4. data/README.md +88 -0
  5. data/Rakefile +121 -0
  6. data/VERSION +1 -0
  7. data/agpl-3.0.txt +661 -0
  8. data/bin/hexapdf +6 -0
  9. data/data/hexapdf/afm/Courier-Bold.afm +342 -0
  10. data/data/hexapdf/afm/Courier-BoldOblique.afm +342 -0
  11. data/data/hexapdf/afm/Courier-Oblique.afm +342 -0
  12. data/data/hexapdf/afm/Courier.afm +342 -0
  13. data/data/hexapdf/afm/Helvetica-Bold.afm +2827 -0
  14. data/data/hexapdf/afm/Helvetica-BoldOblique.afm +2827 -0
  15. data/data/hexapdf/afm/Helvetica-Oblique.afm +3051 -0
  16. data/data/hexapdf/afm/Helvetica.afm +3051 -0
  17. data/data/hexapdf/afm/MustRead.html +1 -0
  18. data/data/hexapdf/afm/Symbol.afm +213 -0
  19. data/data/hexapdf/afm/Times-Bold.afm +2588 -0
  20. data/data/hexapdf/afm/Times-BoldItalic.afm +2384 -0
  21. data/data/hexapdf/afm/Times-Italic.afm +2667 -0
  22. data/data/hexapdf/afm/Times-Roman.afm +2419 -0
  23. data/data/hexapdf/afm/ZapfDingbats.afm +225 -0
  24. data/data/hexapdf/encoding/glyphlist.txt +4305 -0
  25. data/data/hexapdf/encoding/zapfdingbats.txt +225 -0
  26. data/examples/arc.rb +50 -0
  27. data/examples/graphics.rb +274 -0
  28. data/examples/hello_world.rb +16 -0
  29. data/examples/machupicchu.jpg +0 -0
  30. data/examples/merging.rb +24 -0
  31. data/examples/optimizing.rb +20 -0
  32. data/examples/show_char_bboxes.rb +55 -0
  33. data/examples/standard_pdf_fonts.rb +72 -0
  34. data/examples/truetype.rb +45 -0
  35. data/lib/hexapdf/cli/extract.rb +128 -0
  36. data/lib/hexapdf/cli/info.rb +121 -0
  37. data/lib/hexapdf/cli/inspect.rb +157 -0
  38. data/lib/hexapdf/cli/modify.rb +218 -0
  39. data/lib/hexapdf/cli.rb +121 -0
  40. data/lib/hexapdf/configuration.rb +392 -0
  41. data/lib/hexapdf/content/canvas.rb +1974 -0
  42. data/lib/hexapdf/content/color_space.rb +364 -0
  43. data/lib/hexapdf/content/graphic_object/arc.rb +267 -0
  44. data/lib/hexapdf/content/graphic_object/endpoint_arc.rb +208 -0
  45. data/lib/hexapdf/content/graphic_object/solid_arc.rb +173 -0
  46. data/lib/hexapdf/content/graphic_object.rb +81 -0
  47. data/lib/hexapdf/content/graphics_state.rb +579 -0
  48. data/lib/hexapdf/content/operator.rb +1072 -0
  49. data/lib/hexapdf/content/parser.rb +204 -0
  50. data/lib/hexapdf/content/processor.rb +451 -0
  51. data/lib/hexapdf/content/transformation_matrix.rb +172 -0
  52. data/lib/hexapdf/content.rb +47 -0
  53. data/lib/hexapdf/data_dir.rb +51 -0
  54. data/lib/hexapdf/dictionary.rb +303 -0
  55. data/lib/hexapdf/dictionary_fields.rb +382 -0
  56. data/lib/hexapdf/document.rb +589 -0
  57. data/lib/hexapdf/document_utils.rb +209 -0
  58. data/lib/hexapdf/encryption/aes.rb +206 -0
  59. data/lib/hexapdf/encryption/arc4.rb +93 -0
  60. data/lib/hexapdf/encryption/fast_aes.rb +79 -0
  61. data/lib/hexapdf/encryption/fast_arc4.rb +67 -0
  62. data/lib/hexapdf/encryption/identity.rb +63 -0
  63. data/lib/hexapdf/encryption/ruby_aes.rb +447 -0
  64. data/lib/hexapdf/encryption/ruby_arc4.rb +96 -0
  65. data/lib/hexapdf/encryption/security_handler.rb +494 -0
  66. data/lib/hexapdf/encryption/standard_security_handler.rb +616 -0
  67. data/lib/hexapdf/encryption.rb +94 -0
  68. data/lib/hexapdf/error.rb +73 -0
  69. data/lib/hexapdf/filter/ascii85_decode.rb +160 -0
  70. data/lib/hexapdf/filter/ascii_hex_decode.rb +87 -0
  71. data/lib/hexapdf/filter/dct_decode.rb +57 -0
  72. data/lib/hexapdf/filter/encryption.rb +59 -0
  73. data/lib/hexapdf/filter/flate_decode.rb +93 -0
  74. data/lib/hexapdf/filter/jpx_decode.rb +56 -0
  75. data/lib/hexapdf/filter/lzw_decode.rb +191 -0
  76. data/lib/hexapdf/filter/predictor.rb +266 -0
  77. data/lib/hexapdf/filter/run_length_decode.rb +108 -0
  78. data/lib/hexapdf/filter.rb +176 -0
  79. data/lib/hexapdf/font/cmap/parser.rb +146 -0
  80. data/lib/hexapdf/font/cmap/writer.rb +176 -0
  81. data/lib/hexapdf/font/cmap.rb +90 -0
  82. data/lib/hexapdf/font/encoding/base.rb +77 -0
  83. data/lib/hexapdf/font/encoding/difference_encoding.rb +64 -0
  84. data/lib/hexapdf/font/encoding/glyph_list.rb +150 -0
  85. data/lib/hexapdf/font/encoding/mac_expert_encoding.rb +221 -0
  86. data/lib/hexapdf/font/encoding/mac_roman_encoding.rb +265 -0
  87. data/lib/hexapdf/font/encoding/standard_encoding.rb +205 -0
  88. data/lib/hexapdf/font/encoding/symbol_encoding.rb +244 -0
  89. data/lib/hexapdf/font/encoding/win_ansi_encoding.rb +280 -0
  90. data/lib/hexapdf/font/encoding/zapf_dingbats_encoding.rb +250 -0
  91. data/lib/hexapdf/font/encoding.rb +68 -0
  92. data/lib/hexapdf/font/true_type/font.rb +179 -0
  93. data/lib/hexapdf/font/true_type/table/cmap.rb +103 -0
  94. data/lib/hexapdf/font/true_type/table/cmap_subtable.rb +384 -0
  95. data/lib/hexapdf/font/true_type/table/directory.rb +92 -0
  96. data/lib/hexapdf/font/true_type/table/glyf.rb +166 -0
  97. data/lib/hexapdf/font/true_type/table/head.rb +143 -0
  98. data/lib/hexapdf/font/true_type/table/hhea.rb +109 -0
  99. data/lib/hexapdf/font/true_type/table/hmtx.rb +79 -0
  100. data/lib/hexapdf/font/true_type/table/loca.rb +79 -0
  101. data/lib/hexapdf/font/true_type/table/maxp.rb +112 -0
  102. data/lib/hexapdf/font/true_type/table/name.rb +218 -0
  103. data/lib/hexapdf/font/true_type/table/os2.rb +200 -0
  104. data/lib/hexapdf/font/true_type/table/post.rb +230 -0
  105. data/lib/hexapdf/font/true_type/table.rb +155 -0
  106. data/lib/hexapdf/font/true_type.rb +48 -0
  107. data/lib/hexapdf/font/true_type_wrapper.rb +240 -0
  108. data/lib/hexapdf/font/type1/afm_parser.rb +230 -0
  109. data/lib/hexapdf/font/type1/character_metrics.rb +67 -0
  110. data/lib/hexapdf/font/type1/font.rb +123 -0
  111. data/lib/hexapdf/font/type1/font_metrics.rb +117 -0
  112. data/lib/hexapdf/font/type1/pfb_parser.rb +71 -0
  113. data/lib/hexapdf/font/type1.rb +52 -0
  114. data/lib/hexapdf/font/type1_wrapper.rb +193 -0
  115. data/lib/hexapdf/font_loader/from_configuration.rb +70 -0
  116. data/lib/hexapdf/font_loader/standard14.rb +98 -0
  117. data/lib/hexapdf/font_loader.rb +85 -0
  118. data/lib/hexapdf/font_utils.rb +89 -0
  119. data/lib/hexapdf/image_loader/jpeg.rb +166 -0
  120. data/lib/hexapdf/image_loader/pdf.rb +89 -0
  121. data/lib/hexapdf/image_loader/png.rb +410 -0
  122. data/lib/hexapdf/image_loader.rb +68 -0
  123. data/lib/hexapdf/importer.rb +139 -0
  124. data/lib/hexapdf/name_tree_node.rb +78 -0
  125. data/lib/hexapdf/number_tree_node.rb +67 -0
  126. data/lib/hexapdf/object.rb +363 -0
  127. data/lib/hexapdf/parser.rb +349 -0
  128. data/lib/hexapdf/rectangle.rb +99 -0
  129. data/lib/hexapdf/reference.rb +98 -0
  130. data/lib/hexapdf/revision.rb +206 -0
  131. data/lib/hexapdf/revisions.rb +194 -0
  132. data/lib/hexapdf/serializer.rb +326 -0
  133. data/lib/hexapdf/stream.rb +279 -0
  134. data/lib/hexapdf/task/dereference.rb +109 -0
  135. data/lib/hexapdf/task/optimize.rb +230 -0
  136. data/lib/hexapdf/task.rb +68 -0
  137. data/lib/hexapdf/tokenizer.rb +406 -0
  138. data/lib/hexapdf/type/catalog.rb +107 -0
  139. data/lib/hexapdf/type/embedded_file.rb +87 -0
  140. data/lib/hexapdf/type/file_specification.rb +232 -0
  141. data/lib/hexapdf/type/font.rb +81 -0
  142. data/lib/hexapdf/type/font_descriptor.rb +109 -0
  143. data/lib/hexapdf/type/font_simple.rb +190 -0
  144. data/lib/hexapdf/type/font_true_type.rb +47 -0
  145. data/lib/hexapdf/type/font_type1.rb +162 -0
  146. data/lib/hexapdf/type/form.rb +103 -0
  147. data/lib/hexapdf/type/graphics_state_parameter.rb +79 -0
  148. data/lib/hexapdf/type/image.rb +73 -0
  149. data/lib/hexapdf/type/info.rb +70 -0
  150. data/lib/hexapdf/type/names.rb +69 -0
  151. data/lib/hexapdf/type/object_stream.rb +224 -0
  152. data/lib/hexapdf/type/page.rb +355 -0
  153. data/lib/hexapdf/type/page_tree_node.rb +269 -0
  154. data/lib/hexapdf/type/resources.rb +212 -0
  155. data/lib/hexapdf/type/trailer.rb +128 -0
  156. data/lib/hexapdf/type/viewer_preferences.rb +73 -0
  157. data/lib/hexapdf/type/xref_stream.rb +204 -0
  158. data/lib/hexapdf/type.rb +67 -0
  159. data/lib/hexapdf/utils/bit_field.rb +87 -0
  160. data/lib/hexapdf/utils/bit_stream.rb +148 -0
  161. data/lib/hexapdf/utils/lru_cache.rb +65 -0
  162. data/lib/hexapdf/utils/math_helpers.rb +55 -0
  163. data/lib/hexapdf/utils/object_hash.rb +130 -0
  164. data/lib/hexapdf/utils/pdf_doc_encoding.rb +93 -0
  165. data/lib/hexapdf/utils/sorted_tree_node.rb +339 -0
  166. data/lib/hexapdf/version.rb +39 -0
  167. data/lib/hexapdf/writer.rb +199 -0
  168. data/lib/hexapdf/xref_section.rb +152 -0
  169. data/lib/hexapdf.rb +34 -0
  170. data/man/man1/hexapdf.1 +249 -0
  171. data/test/data/aes-test-vectors/CBCGFSbox-128-decrypt.data.gz +0 -0
  172. data/test/data/aes-test-vectors/CBCGFSbox-128-encrypt.data.gz +0 -0
  173. data/test/data/aes-test-vectors/CBCGFSbox-192-decrypt.data.gz +0 -0
  174. data/test/data/aes-test-vectors/CBCGFSbox-192-encrypt.data.gz +0 -0
  175. data/test/data/aes-test-vectors/CBCGFSbox-256-decrypt.data.gz +0 -0
  176. data/test/data/aes-test-vectors/CBCGFSbox-256-encrypt.data.gz +0 -0
  177. data/test/data/aes-test-vectors/CBCKeySbox-128-decrypt.data.gz +0 -0
  178. data/test/data/aes-test-vectors/CBCKeySbox-128-encrypt.data.gz +0 -0
  179. data/test/data/aes-test-vectors/CBCKeySbox-192-decrypt.data.gz +0 -0
  180. data/test/data/aes-test-vectors/CBCKeySbox-192-encrypt.data.gz +0 -0
  181. data/test/data/aes-test-vectors/CBCKeySbox-256-decrypt.data.gz +0 -0
  182. data/test/data/aes-test-vectors/CBCKeySbox-256-encrypt.data.gz +0 -0
  183. data/test/data/aes-test-vectors/CBCVarKey-128-decrypt.data.gz +0 -0
  184. data/test/data/aes-test-vectors/CBCVarKey-128-encrypt.data.gz +0 -0
  185. data/test/data/aes-test-vectors/CBCVarKey-192-decrypt.data.gz +0 -0
  186. data/test/data/aes-test-vectors/CBCVarKey-192-encrypt.data.gz +0 -0
  187. data/test/data/aes-test-vectors/CBCVarKey-256-decrypt.data.gz +0 -0
  188. data/test/data/aes-test-vectors/CBCVarKey-256-encrypt.data.gz +0 -0
  189. data/test/data/aes-test-vectors/CBCVarTxt-128-decrypt.data.gz +0 -0
  190. data/test/data/aes-test-vectors/CBCVarTxt-128-encrypt.data.gz +0 -0
  191. data/test/data/aes-test-vectors/CBCVarTxt-192-decrypt.data.gz +0 -0
  192. data/test/data/aes-test-vectors/CBCVarTxt-192-encrypt.data.gz +0 -0
  193. data/test/data/aes-test-vectors/CBCVarTxt-256-decrypt.data.gz +0 -0
  194. data/test/data/aes-test-vectors/CBCVarTxt-256-encrypt.data.gz +0 -0
  195. data/test/data/fonts/Ubuntu-Title.ttf +0 -0
  196. data/test/data/images/cmyk.jpg +0 -0
  197. data/test/data/images/fillbytes.jpg +0 -0
  198. data/test/data/images/gray.jpg +0 -0
  199. data/test/data/images/greyscale-1bit.png +0 -0
  200. data/test/data/images/greyscale-2bit.png +0 -0
  201. data/test/data/images/greyscale-4bit.png +0 -0
  202. data/test/data/images/greyscale-8bit.png +0 -0
  203. data/test/data/images/greyscale-alpha-8bit.png +0 -0
  204. data/test/data/images/greyscale-trns-8bit.png +0 -0
  205. data/test/data/images/greyscale-with-gamma1.0.png +0 -0
  206. data/test/data/images/greyscale-with-gamma1.5.png +0 -0
  207. data/test/data/images/indexed-1bit.png +0 -0
  208. data/test/data/images/indexed-2bit.png +0 -0
  209. data/test/data/images/indexed-4bit.png +0 -0
  210. data/test/data/images/indexed-8bit.png +0 -0
  211. data/test/data/images/indexed-alpha-4bit.png +0 -0
  212. data/test/data/images/indexed-alpha-8bit.png +0 -0
  213. data/test/data/images/rgb.jpg +0 -0
  214. data/test/data/images/truecolour-8bit.png +0 -0
  215. data/test/data/images/truecolour-alpha-8bit.png +0 -0
  216. data/test/data/images/truecolour-gama-chrm-8bit.png +0 -0
  217. data/test/data/images/truecolour-srgb-8bit.png +0 -0
  218. data/test/data/minimal.pdf +44 -0
  219. data/test/data/standard-security-handler/README +9 -0
  220. data/test/data/standard-security-handler/bothpwd-aes-128bit-V4.pdf +44 -0
  221. data/test/data/standard-security-handler/bothpwd-aes-256bit-V5.pdf +0 -0
  222. data/test/data/standard-security-handler/bothpwd-arc4-128bit-V2.pdf +43 -0
  223. data/test/data/standard-security-handler/bothpwd-arc4-128bit-V4.pdf +43 -0
  224. data/test/data/standard-security-handler/bothpwd-arc4-40bit-V1.pdf +0 -0
  225. data/test/data/standard-security-handler/nopwd-aes-128bit-V4.pdf +43 -0
  226. data/test/data/standard-security-handler/nopwd-aes-256bit-V5.pdf +0 -0
  227. data/test/data/standard-security-handler/nopwd-arc4-128bit-V2.pdf +43 -0
  228. data/test/data/standard-security-handler/nopwd-arc4-128bit-V4.pdf +43 -0
  229. data/test/data/standard-security-handler/nopwd-arc4-40bit-V1.pdf +43 -0
  230. data/test/data/standard-security-handler/ownerpwd-aes-128bit-V4.pdf +0 -0
  231. data/test/data/standard-security-handler/ownerpwd-aes-256bit-V5.pdf +43 -0
  232. data/test/data/standard-security-handler/ownerpwd-arc4-128bit-V2.pdf +43 -0
  233. data/test/data/standard-security-handler/ownerpwd-arc4-128bit-V4.pdf +43 -0
  234. data/test/data/standard-security-handler/ownerpwd-arc4-40bit-V1.pdf +43 -0
  235. data/test/data/standard-security-handler/userpwd-aes-128bit-V4.pdf +43 -0
  236. data/test/data/standard-security-handler/userpwd-aes-256bit-V5.pdf +43 -0
  237. data/test/data/standard-security-handler/userpwd-arc4-128bit-V2.pdf +0 -0
  238. data/test/data/standard-security-handler/userpwd-arc4-128bit-V4.pdf +0 -0
  239. data/test/data/standard-security-handler/userpwd-arc4-40bit-V1.pdf +43 -0
  240. data/test/hexapdf/common_tokenizer_tests.rb +204 -0
  241. data/test/hexapdf/content/common.rb +31 -0
  242. data/test/hexapdf/content/graphic_object/test_arc.rb +93 -0
  243. data/test/hexapdf/content/graphic_object/test_endpoint_arc.rb +91 -0
  244. data/test/hexapdf/content/graphic_object/test_solid_arc.rb +86 -0
  245. data/test/hexapdf/content/test_canvas.rb +1113 -0
  246. data/test/hexapdf/content/test_color_space.rb +97 -0
  247. data/test/hexapdf/content/test_graphics_state.rb +138 -0
  248. data/test/hexapdf/content/test_operator.rb +619 -0
  249. data/test/hexapdf/content/test_parser.rb +66 -0
  250. data/test/hexapdf/content/test_processor.rb +156 -0
  251. data/test/hexapdf/content/test_transformation_matrix.rb +64 -0
  252. data/test/hexapdf/encryption/common.rb +87 -0
  253. data/test/hexapdf/encryption/test_aes.rb +121 -0
  254. data/test/hexapdf/encryption/test_arc4.rb +39 -0
  255. data/test/hexapdf/encryption/test_fast_aes.rb +17 -0
  256. data/test/hexapdf/encryption/test_fast_arc4.rb +12 -0
  257. data/test/hexapdf/encryption/test_identity.rb +21 -0
  258. data/test/hexapdf/encryption/test_ruby_aes.rb +23 -0
  259. data/test/hexapdf/encryption/test_ruby_arc4.rb +20 -0
  260. data/test/hexapdf/encryption/test_security_handler.rb +356 -0
  261. data/test/hexapdf/encryption/test_standard_security_handler.rb +274 -0
  262. data/test/hexapdf/filter/common.rb +53 -0
  263. data/test/hexapdf/filter/test_ascii85_decode.rb +60 -0
  264. data/test/hexapdf/filter/test_ascii_hex_decode.rb +33 -0
  265. data/test/hexapdf/filter/test_encryption.rb +24 -0
  266. data/test/hexapdf/filter/test_flate_decode.rb +35 -0
  267. data/test/hexapdf/filter/test_lzw_decode.rb +52 -0
  268. data/test/hexapdf/filter/test_predictor.rb +183 -0
  269. data/test/hexapdf/filter/test_run_length_decode.rb +32 -0
  270. data/test/hexapdf/font/cmap/test_parser.rb +67 -0
  271. data/test/hexapdf/font/cmap/test_writer.rb +58 -0
  272. data/test/hexapdf/font/encoding/test_base.rb +35 -0
  273. data/test/hexapdf/font/encoding/test_difference_encoding.rb +21 -0
  274. data/test/hexapdf/font/encoding/test_glyph_list.rb +59 -0
  275. data/test/hexapdf/font/encoding/test_zapf_dingbats_encoding.rb +16 -0
  276. data/test/hexapdf/font/test_encoding.rb +27 -0
  277. data/test/hexapdf/font/test_true_type_wrapper.rb +110 -0
  278. data/test/hexapdf/font/test_type1_wrapper.rb +66 -0
  279. data/test/hexapdf/font/true_type/common.rb +19 -0
  280. data/test/hexapdf/font/true_type/table/test_cmap.rb +59 -0
  281. data/test/hexapdf/font/true_type/table/test_cmap_subtable.rb +133 -0
  282. data/test/hexapdf/font/true_type/table/test_directory.rb +35 -0
  283. data/test/hexapdf/font/true_type/table/test_glyf.rb +58 -0
  284. data/test/hexapdf/font/true_type/table/test_head.rb +76 -0
  285. data/test/hexapdf/font/true_type/table/test_hhea.rb +40 -0
  286. data/test/hexapdf/font/true_type/table/test_hmtx.rb +38 -0
  287. data/test/hexapdf/font/true_type/table/test_loca.rb +43 -0
  288. data/test/hexapdf/font/true_type/table/test_maxp.rb +62 -0
  289. data/test/hexapdf/font/true_type/table/test_name.rb +95 -0
  290. data/test/hexapdf/font/true_type/table/test_os2.rb +65 -0
  291. data/test/hexapdf/font/true_type/table/test_post.rb +89 -0
  292. data/test/hexapdf/font/true_type/test_font.rb +120 -0
  293. data/test/hexapdf/font/true_type/test_table.rb +41 -0
  294. data/test/hexapdf/font/type1/test_afm_parser.rb +51 -0
  295. data/test/hexapdf/font/type1/test_font.rb +68 -0
  296. data/test/hexapdf/font/type1/test_pfb_parser.rb +37 -0
  297. data/test/hexapdf/font_loader/test_from_configuration.rb +28 -0
  298. data/test/hexapdf/font_loader/test_standard14.rb +22 -0
  299. data/test/hexapdf/image_loader/test_jpeg.rb +83 -0
  300. data/test/hexapdf/image_loader/test_pdf.rb +47 -0
  301. data/test/hexapdf/image_loader/test_png.rb +258 -0
  302. data/test/hexapdf/task/test_dereference.rb +46 -0
  303. data/test/hexapdf/task/test_optimize.rb +137 -0
  304. data/test/hexapdf/test_configuration.rb +82 -0
  305. data/test/hexapdf/test_data_dir.rb +32 -0
  306. data/test/hexapdf/test_dictionary.rb +284 -0
  307. data/test/hexapdf/test_dictionary_fields.rb +185 -0
  308. data/test/hexapdf/test_document.rb +574 -0
  309. data/test/hexapdf/test_document_utils.rb +144 -0
  310. data/test/hexapdf/test_filter.rb +96 -0
  311. data/test/hexapdf/test_font_utils.rb +47 -0
  312. data/test/hexapdf/test_importer.rb +78 -0
  313. data/test/hexapdf/test_object.rb +177 -0
  314. data/test/hexapdf/test_parser.rb +394 -0
  315. data/test/hexapdf/test_rectangle.rb +36 -0
  316. data/test/hexapdf/test_reference.rb +41 -0
  317. data/test/hexapdf/test_revision.rb +139 -0
  318. data/test/hexapdf/test_revisions.rb +93 -0
  319. data/test/hexapdf/test_serializer.rb +169 -0
  320. data/test/hexapdf/test_stream.rb +262 -0
  321. data/test/hexapdf/test_tokenizer.rb +30 -0
  322. data/test/hexapdf/test_writer.rb +120 -0
  323. data/test/hexapdf/test_xref_section.rb +35 -0
  324. data/test/hexapdf/type/test_catalog.rb +30 -0
  325. data/test/hexapdf/type/test_embedded_file.rb +16 -0
  326. data/test/hexapdf/type/test_file_specification.rb +148 -0
  327. data/test/hexapdf/type/test_font.rb +35 -0
  328. data/test/hexapdf/type/test_font_descriptor.rb +51 -0
  329. data/test/hexapdf/type/test_font_simple.rb +190 -0
  330. data/test/hexapdf/type/test_font_type1.rb +128 -0
  331. data/test/hexapdf/type/test_form.rb +60 -0
  332. data/test/hexapdf/type/test_info.rb +14 -0
  333. data/test/hexapdf/type/test_names.rb +9 -0
  334. data/test/hexapdf/type/test_object_stream.rb +84 -0
  335. data/test/hexapdf/type/test_page.rb +260 -0
  336. data/test/hexapdf/type/test_page_tree_node.rb +255 -0
  337. data/test/hexapdf/type/test_resources.rb +167 -0
  338. data/test/hexapdf/type/test_trailer.rb +109 -0
  339. data/test/hexapdf/type/test_xref_stream.rb +131 -0
  340. data/test/hexapdf/utils/test_bit_field.rb +47 -0
  341. data/test/hexapdf/utils/test_lru_cache.rb +22 -0
  342. data/test/hexapdf/utils/test_object_hash.rb +115 -0
  343. data/test/hexapdf/utils/test_pdf_doc_encoding.rb +18 -0
  344. data/test/hexapdf/utils/test_sorted_tree_node.rb +232 -0
  345. data/test/test_helper.rb +56 -0
  346. metadata +427 -0
@@ -0,0 +1,191 @@
1
+ # -*- encoding: utf-8 -*-
2
+ #
3
+ #--
4
+ # This file is part of HexaPDF.
5
+ #
6
+ # HexaPDF - A Versatile PDF Creation and Manipulation Library For Ruby
7
+ # Copyright (C) 2016 Thomas Leitner
8
+ #
9
+ # HexaPDF is free software: you can redistribute it and/or modify it
10
+ # under the terms of the GNU Affero General Public License version 3 as
11
+ # published by the Free Software Foundation with the addition of the
12
+ # following permission added to Section 15 as permitted in Section 7(a):
13
+ # FOR ANY PART OF THE COVERED WORK IN WHICH THE COPYRIGHT IS OWNED BY
14
+ # THOMAS LEITNER, THOMAS LEITNER DISCLAIMS THE WARRANTY OF NON
15
+ # INFRINGEMENT OF THIRD PARTY RIGHTS.
16
+ #
17
+ # HexaPDF is distributed in the hope that it will be useful, but WITHOUT
18
+ # ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
19
+ # FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public
20
+ # License for more details.
21
+ #
22
+ # You should have received a copy of the GNU Affero General Public License
23
+ # along with HexaPDF. If not, see <http://www.gnu.org/licenses/>.
24
+ #
25
+ # The interactive user interfaces in modified source and object code
26
+ # versions of HexaPDF must display Appropriate Legal Notices, as required
27
+ # under Section 5 of the GNU Affero General Public License version 3.
28
+ #
29
+ # In accordance with Section 7(b) of the GNU Affero General Public
30
+ # License, a covered work must retain the producer line in every PDF that
31
+ # is created or manipulated using HexaPDF.
32
+ #++
33
+
34
+ require 'fiber'
35
+ require 'hexapdf/utils/bit_stream'
36
+ require 'hexapdf/filter/predictor'
37
+ require 'hexapdf/error'
38
+
39
+ module HexaPDF
40
+ module Filter
41
+
42
+ # Implements the LZW filter.
43
+ #
44
+ # Since LZW uses a tightly packed bit stream in which codes are of varying bit lengths and are
45
+ # not aligned to byte boundaries, this filter is not as fast as the other filters. If speed is
46
+ # a concern, the FlateDecode filter should be used instead.
47
+ #
48
+ # See: HexaPDF::Filter, PDF1.7 s7.4.4
49
+ module LZWDecode
50
+
51
+ CLEAR_TABLE = 256 # :nodoc:
52
+ EOD = 257 # :nodoc:
53
+
54
+ INITIAL_ENCODER_TABLE = {} #:nodoc:
55
+ 0.upto(255) {|i| INITIAL_ENCODER_TABLE[i.chr.freeze] = i}
56
+ INITIAL_ENCODER_TABLE[CLEAR_TABLE] = CLEAR_TABLE
57
+ INITIAL_ENCODER_TABLE[EOD] = EOD
58
+
59
+ INITIAL_DECODER_TABLE = {} #:nodoc:
60
+ 0.upto(255) {|i| INITIAL_DECODER_TABLE[i] = i.chr}
61
+ INITIAL_DECODER_TABLE[CLEAR_TABLE] = CLEAR_TABLE
62
+ INITIAL_DECODER_TABLE[EOD] = EOD
63
+
64
+ # See HexaPDF::Filter
65
+ def self.decoder(source, options = nil)
66
+ fib = Fiber.new do
67
+ # initialize decoder state
68
+ code_length = 9
69
+ table = INITIAL_DECODER_TABLE.dup
70
+
71
+ stream = HexaPDF::Utils::BitStreamReader.new
72
+ result = ''.b
73
+ finished = false
74
+ last_code = CLEAR_TABLE
75
+
76
+ while !finished && source.alive? && (data = source.resume)
77
+ stream.append_data(data)
78
+
79
+ while stream.read?(code_length)
80
+ code = stream.read(code_length)
81
+
82
+ # Decoder is one step behind => subtract 1!
83
+ # We check the table size before entering the next code into it => subtract 1, but
84
+ # there is one exception: After table entry 4095 is written, the clear table code
85
+ # also gets written with code length 12,
86
+ case table.size
87
+ when 510, 1022, 2046
88
+ code_length += 1
89
+ when 4095
90
+ if code != CLEAR_TABLE
91
+ raise FilterError, "Maximum of 12bit for codes in LZW stream exceeded"
92
+ end
93
+ end
94
+
95
+ if code == EOD
96
+ finished = true
97
+ break
98
+ elsif code == CLEAR_TABLE
99
+ # reset decoder state
100
+ code_length = 9
101
+ table = INITIAL_DECODER_TABLE.dup
102
+ elsif last_code == CLEAR_TABLE
103
+ unless table.key?(code)
104
+ raise FilterError, "Unknown code in LZW encoded stream found"
105
+ end
106
+ result << table[code]
107
+ else
108
+ unless table.key?(last_code)
109
+ raise FilterError, "Unknown code in LZW encoded stream found"
110
+ end
111
+ last_str = table[last_code]
112
+
113
+ str = if table.key?(code)
114
+ table[code]
115
+ else
116
+ last_str + last_str[0]
117
+ end
118
+ result << str
119
+ table[table.size] = last_str + str[0]
120
+ end
121
+
122
+ last_code = code
123
+ end
124
+
125
+ Fiber.yield(result)
126
+ result = ''.b
127
+ end
128
+ end
129
+
130
+ if options && options[:Predictor]
131
+ Predictor.decoder(fib, options)
132
+ else
133
+ fib
134
+ end
135
+ end
136
+
137
+ # See HexaPDF::Filter
138
+ def self.encoder(source, options = nil)
139
+ if options && options[:Predictor]
140
+ source = Predictor.encoder(source, options)
141
+ end
142
+
143
+ Fiber.new do
144
+ # initialize encoder state
145
+ code_length = 9
146
+ table = INITIAL_ENCODER_TABLE.dup
147
+
148
+ # initialize the bit stream with the clear-table marker
149
+ stream = HexaPDF::Utils::BitStreamWriter.new
150
+ result = stream.write(CLEAR_TABLE, 9)
151
+ str = ''.b
152
+
153
+ while source.alive? && (data = source.resume)
154
+ data.each_char do |char|
155
+ newstr = str + char
156
+ if table.key?(newstr)
157
+ str = newstr
158
+ else
159
+ result << stream.write(table[str], code_length)
160
+ table[newstr.freeze] = table.size
161
+ str = char
162
+ end
163
+
164
+ case table.size
165
+ when 512 then code_length = 10
166
+ when 1024 then code_length = 11
167
+ when 2048 then code_length = 12
168
+ when 4096
169
+ result << stream.write(CLEAR_TABLE, code_length)
170
+ # reset encoder state
171
+ code_length = 9
172
+ table = INITIAL_ENCODER_TABLE.dup
173
+ end
174
+ end
175
+
176
+ Fiber.yield(result)
177
+ result = ''.b
178
+ end
179
+
180
+ result = stream.write(table[str], code_length)
181
+ result << stream.write(EOD, code_length)
182
+ result << stream.finalize
183
+
184
+ result
185
+ end
186
+ end
187
+
188
+ end
189
+
190
+ end
191
+ end
@@ -0,0 +1,266 @@
1
+ # -*- encoding: utf-8 -*-
2
+ #
3
+ #--
4
+ # This file is part of HexaPDF.
5
+ #
6
+ # HexaPDF - A Versatile PDF Creation and Manipulation Library For Ruby
7
+ # Copyright (C) 2016 Thomas Leitner
8
+ #
9
+ # HexaPDF is free software: you can redistribute it and/or modify it
10
+ # under the terms of the GNU Affero General Public License version 3 as
11
+ # published by the Free Software Foundation with the addition of the
12
+ # following permission added to Section 15 as permitted in Section 7(a):
13
+ # FOR ANY PART OF THE COVERED WORK IN WHICH THE COPYRIGHT IS OWNED BY
14
+ # THOMAS LEITNER, THOMAS LEITNER DISCLAIMS THE WARRANTY OF NON
15
+ # INFRINGEMENT OF THIRD PARTY RIGHTS.
16
+ #
17
+ # HexaPDF is distributed in the hope that it will be useful, but WITHOUT
18
+ # ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
19
+ # FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public
20
+ # License for more details.
21
+ #
22
+ # You should have received a copy of the GNU Affero General Public License
23
+ # along with HexaPDF. If not, see <http://www.gnu.org/licenses/>.
24
+ #
25
+ # The interactive user interfaces in modified source and object code
26
+ # versions of HexaPDF must display Appropriate Legal Notices, as required
27
+ # under Section 5 of the GNU Affero General Public License version 3.
28
+ #
29
+ # In accordance with Section 7(b) of the GNU Affero General Public
30
+ # License, a covered work must retain the producer line in every PDF that
31
+ # is created or manipulated using HexaPDF.
32
+ #++
33
+
34
+ require 'fiber'
35
+ require 'hexapdf/error'
36
+ require 'hexapdf/utils/bit_stream'
37
+
38
+ module HexaPDF
39
+ module Filter
40
+
41
+ # Implements the predictor for the LZWDecode and FlateDecode filters.
42
+ #
43
+ # Although a predictor isn't a full PDF filter, it is implemented as one in HexaPDF terms to
44
+ # allow easy chaining of the predictor.
45
+ #
46
+ # See: PDF1.7 s7.4.4.3, s7.4.4.4, https://partners.adobe.com/public/developer/en/tiff/TIFF6.pdf
47
+ # (p64f), http://www.w3.org/TR/PNG-Filters.html
48
+ #
49
+ #-- Implemenation notes:
50
+ #
51
+ # The TIFF encoding and decoding methods are the same, except for the innermost loop. The way
52
+ # it is implemented is probably not the best but it avoids duplicate code.
53
+ #
54
+ # The situation is similar with PNG encoding and decoding.
55
+ #++
56
+ module Predictor
57
+
58
+ PREDICTOR_PNG_NONE = 0 #:nodoc:
59
+ PREDICTOR_PNG_SUB = 1 #:nodoc:
60
+ PREDICTOR_PNG_UP = 2 #:nodoc:
61
+ PREDICTOR_PNG_AVERAGE = 3 #:nodoc:
62
+ PREDICTOR_PNG_PAETH = 4 #:nodoc:
63
+ PREDICTOR_PNG_OPTIMUM = 5 #:nodoc:
64
+
65
+ # See HexaPDF::Filter
66
+ def self.decoder(source, options)
67
+ execute(:decoder, source, options)
68
+ end
69
+
70
+ # See HexaPDF::Filter
71
+ def self.encoder(source, options)
72
+ execute(:encoder, source, options)
73
+ end
74
+
75
+ def self.execute(type, source, options) # :nodoc:
76
+ return source if !options[:Predictor] || options[:Predictor] == 1
77
+
78
+ colors = options[:Colors] || 1
79
+ bits_per_component = options[:BitsPerComponent] || 8
80
+ columns = options[:Columns] || 1
81
+
82
+ if options[:Predictor] == 2
83
+ tiff_execute(type, source, colors, bits_per_component, columns)
84
+ elsif options[:Predictor] >= 10
85
+ png_execute(type, source, options[:Predictor], colors, bits_per_component, columns)
86
+ else
87
+ raise HexaPDF::InvalidPDFObjectError, "Predictor key is invalid: #{options[:Predictor]}"
88
+ end
89
+ end
90
+
91
+ def self.tiff_execute(type, source, colors, bits_per_component, columns) # :nodoc:
92
+ Fiber.new do
93
+ bytes_per_row = (columns * bits_per_component * colors + 7) / 8
94
+ mask = (1 << bits_per_component) - 1
95
+
96
+ data = ''.b
97
+ writer = HexaPDF::Utils::BitStreamWriter.new
98
+ pos = 0
99
+
100
+ decode_row = lambda do |result, reader|
101
+ last_components = [0] * colors
102
+ (columns * colors).times do |i|
103
+ i %= colors
104
+ tmp = (reader.read(bits_per_component) + last_components[i]) & mask
105
+ result << writer.write(tmp, bits_per_component)
106
+ last_components[i] = tmp
107
+ end
108
+ result << writer.finalize
109
+ end
110
+
111
+ encode_row = lambda do |result, reader|
112
+ last_components = [0] * colors
113
+ (columns * colors).times do |i|
114
+ i %= colors
115
+ tmp = reader.read(bits_per_component)
116
+ result << writer.write((tmp - last_components[i]) & mask, bits_per_component)
117
+ last_components[i] = tmp
118
+ end
119
+ result << writer.finalize
120
+ end
121
+
122
+ row_action = (type == :decoder ? decode_row : encode_row)
123
+
124
+ while source.alive? && (new_data = source.resume)
125
+ data.slice!(0...pos)
126
+ data << new_data
127
+
128
+ result = ''.b
129
+ pos = 0
130
+
131
+ while pos + bytes_per_row <= data.length
132
+ reader = HexaPDF::Utils::BitStreamReader.new(data[pos, bytes_per_row])
133
+ row_action.call(result, reader)
134
+ pos += bytes_per_row
135
+ end
136
+
137
+ Fiber.yield(result) unless result.empty?
138
+ end
139
+
140
+ unless pos == data.length
141
+ raise FilterError, "Data is missing for TIFF predictor"
142
+ end
143
+ end
144
+ end
145
+
146
+ def self.png_execute(type, source, predictor, colors, bits_per_component, columns) # :nodoc:
147
+ Fiber.new do
148
+ bytes_per_pixel = (bits_per_component * colors + 7) / 8
149
+ bytes_per_row = (columns * bits_per_component * colors + 7) / 8
150
+ bytes_per_row += 1 if type == :decoder
151
+
152
+ # Only on encoding: Arbitrarily choose a predictor if we should choose the optimum
153
+ predictor = predictor == 15 ? PREDICTOR_PNG_PAETH : predictor - 10
154
+
155
+ data = ''.b
156
+ last_line = "\0".b * (bytes_per_row + 1)
157
+ pos = 0
158
+
159
+ decode_row = lambda do |result|
160
+ line = data[pos, bytes_per_row]
161
+
162
+ case line.getbyte(0)
163
+ when PREDICTOR_PNG_NONE
164
+ # nothing to do
165
+ when PREDICTOR_PNG_SUB
166
+ (bytes_per_pixel + 1).upto(bytes_per_row - 1) do |i|
167
+ line.setbyte(i, line.getbyte(i) + line.getbyte(i - bytes_per_pixel))
168
+ end
169
+ when PREDICTOR_PNG_UP
170
+ 1.upto(bytes_per_row - 1) do |i|
171
+ line.setbyte(i, line.getbyte(i) + last_line.getbyte(i))
172
+ end
173
+ when PREDICTOR_PNG_AVERAGE
174
+ 1.upto(bytes_per_row - 1) do |i|
175
+ a = i <= bytes_per_pixel ? 0 : line.getbyte(i - bytes_per_pixel)
176
+ line.setbyte(i, line.getbyte(i) + ((a + last_line.getbyte(i)) >> 1))
177
+ end
178
+ when PREDICTOR_PNG_PAETH
179
+ 1.upto(bytes_per_row - 1) do |i|
180
+ a = i <= bytes_per_pixel ? 0 : line.getbyte(i - bytes_per_pixel)
181
+ b = last_line.getbyte(i)
182
+ c = i <= bytes_per_pixel ? 0 : last_line.getbyte(i - bytes_per_pixel)
183
+
184
+ point = a + b - c
185
+ pa = (point - a).abs
186
+ pb = (point - b).abs
187
+ pc = (point - c).abs
188
+
189
+ point = ((pa <= pb && pa <= pc) ? a : (pb <= pc ? b : c))
190
+
191
+ line.setbyte(i, line.getbyte(i) + point)
192
+ end
193
+ end
194
+
195
+ result << line[1..-1]
196
+ last_line = line
197
+ end
198
+
199
+ encode_row = lambda do |result|
200
+ line = predictor.chr.force_encoding(Encoding::BINARY) << data[pos, bytes_per_row]
201
+ next_last_line = line.dup
202
+
203
+ case predictor
204
+ when PREDICTOR_PNG_NONE
205
+ # nothing to do
206
+ when PREDICTOR_PNG_SUB
207
+ bytes_per_row.downto(bytes_per_pixel + 1) do |i|
208
+ line.setbyte(i, line.getbyte(i) - line.getbyte(i - bytes_per_pixel))
209
+ end
210
+ when PREDICTOR_PNG_UP
211
+ bytes_per_row.downto(1) do |i|
212
+ line.setbyte(i, line.getbyte(i) - last_line.getbyte(i))
213
+ end
214
+ when PREDICTOR_PNG_AVERAGE
215
+ bytes_per_row.downto(1) do |i|
216
+ a = i <= bytes_per_pixel ? 0 : line.getbyte(i - bytes_per_pixel)
217
+ line.setbyte(i, line.getbyte(i) - ((a + last_line.getbyte(i)) >> 1))
218
+ end
219
+ when PREDICTOR_PNG_PAETH
220
+ bytes_per_row.downto(1) do |i|
221
+ a = i <= bytes_per_pixel ? 0 : line.getbyte(i - bytes_per_pixel)
222
+ b = last_line.getbyte(i)
223
+ c = i <= bytes_per_pixel ? 0 : last_line.getbyte(i - bytes_per_pixel)
224
+
225
+ point = a + b - c
226
+ pa = (point - a).abs
227
+ pb = (point - b).abs
228
+ pc = (point - c).abs
229
+
230
+ point = ((pa <= pb && pa <= pc) ? a : (pb <= pc ? b : c))
231
+
232
+ line.setbyte(i, line.getbyte(i) - point)
233
+ end
234
+ end
235
+
236
+ result << line
237
+ last_line = next_last_line
238
+ end
239
+
240
+ row_action = (type == :decoder ? decode_row : encode_row)
241
+
242
+ while source.alive? && (new_data = source.resume)
243
+ data.slice!(0...pos)
244
+ data << new_data
245
+
246
+ result = ''.b
247
+ pos = 0
248
+
249
+ while pos + bytes_per_row <= data.length
250
+ row_action.call(result)
251
+ pos += bytes_per_row
252
+ end
253
+
254
+ Fiber.yield(result) unless result.empty?
255
+ end
256
+
257
+ unless pos == data.length
258
+ raise FilterError, "Data is missing for PNG predictor"
259
+ end
260
+ end
261
+ end
262
+
263
+ end
264
+
265
+ end
266
+ end
@@ -0,0 +1,108 @@
1
+ # -*- encoding: utf-8 -*-
2
+ #
3
+ #--
4
+ # This file is part of HexaPDF.
5
+ #
6
+ # HexaPDF - A Versatile PDF Creation and Manipulation Library For Ruby
7
+ # Copyright (C) 2016 Thomas Leitner
8
+ #
9
+ # HexaPDF is free software: you can redistribute it and/or modify it
10
+ # under the terms of the GNU Affero General Public License version 3 as
11
+ # published by the Free Software Foundation with the addition of the
12
+ # following permission added to Section 15 as permitted in Section 7(a):
13
+ # FOR ANY PART OF THE COVERED WORK IN WHICH THE COPYRIGHT IS OWNED BY
14
+ # THOMAS LEITNER, THOMAS LEITNER DISCLAIMS THE WARRANTY OF NON
15
+ # INFRINGEMENT OF THIRD PARTY RIGHTS.
16
+ #
17
+ # HexaPDF is distributed in the hope that it will be useful, but WITHOUT
18
+ # ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
19
+ # FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public
20
+ # License for more details.
21
+ #
22
+ # You should have received a copy of the GNU Affero General Public License
23
+ # along with HexaPDF. If not, see <http://www.gnu.org/licenses/>.
24
+ #
25
+ # The interactive user interfaces in modified source and object code
26
+ # versions of HexaPDF must display Appropriate Legal Notices, as required
27
+ # under Section 5 of the GNU Affero General Public License version 3.
28
+ #
29
+ # In accordance with Section 7(b) of the GNU Affero General Public
30
+ # License, a covered work must retain the producer line in every PDF that
31
+ # is created or manipulated using HexaPDF.
32
+ #++
33
+
34
+ require 'fiber'
35
+ require 'strscan'
36
+ require 'hexapdf/error'
37
+
38
+ module HexaPDF
39
+ module Filter
40
+
41
+ # Implements the run length filter.
42
+ #
43
+ # See: HexaPDF::Filter, PDF1.7 s7.4.5
44
+ module RunLengthDecode
45
+
46
+ EOD = 128.chr #:nodoc:
47
+
48
+ # See HexaPDF::Filter
49
+ def self.decoder(source, _ = nil)
50
+ Fiber.new do
51
+ i = 0
52
+ result = ''.b
53
+ data = source.resume
54
+ while data && i < data.length
55
+ length = data.getbyte(i)
56
+ if length < 128 && i + length + 1 < data.length # no byte run and enough bytes
57
+ result << data[i + 1, length + 1]
58
+ i += length + 2
59
+ elsif length > 128 && i + 1 < data.length # byte run and enough bytes
60
+ result << data[i + 1] * (257 - length)
61
+ i += 2
62
+ elsif length != 128 # not enough bytes in data
63
+ Fiber.yield(result)
64
+ if source.alive? && (new_data = source.resume)
65
+ data = data[i..-1] << new_data
66
+ else
67
+ raise FilterError, "Missing data for run length encoded stream"
68
+ end
69
+ i = 0
70
+ result = ''.b
71
+ else # EOD reached
72
+ break
73
+ end
74
+
75
+ if i == data.length && source.alive? && (data = source.resume)
76
+ Fiber.yield(result)
77
+ i = 0
78
+ result = ''.b
79
+ end
80
+ end
81
+ result unless result.empty?
82
+ end
83
+ end
84
+
85
+ # See HexaPDF::Filter
86
+ def self.encoder(source, _ = nil)
87
+ Fiber.new do
88
+ while source.alive? && (data = source.resume)
89
+ result = ''.b
90
+ strscan = StringScanner.new(data)
91
+ until strscan.eos?
92
+ if strscan.scan(/(.)\1{1,127}/m) # a run of <= 128 same characters
93
+ result << (257 - strscan.matched_size).chr << strscan[1]
94
+ else # a run of characters until two same characters or length > 128
95
+ match = strscan.scan(/.{1,128}?(?=(.)\1|\z)|.{128}/m)
96
+ result << (match.length - 1).chr << match
97
+ end
98
+ end
99
+ Fiber.yield(result)
100
+ end
101
+ EOD
102
+ end
103
+ end
104
+
105
+ end
106
+
107
+ end
108
+ end