hexapdf 0.1.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +7 -0
- data/CONTRIBUTERS +3 -0
- data/LICENSE +26 -0
- data/README.md +88 -0
- data/Rakefile +121 -0
- data/VERSION +1 -0
- data/agpl-3.0.txt +661 -0
- data/bin/hexapdf +6 -0
- data/data/hexapdf/afm/Courier-Bold.afm +342 -0
- data/data/hexapdf/afm/Courier-BoldOblique.afm +342 -0
- data/data/hexapdf/afm/Courier-Oblique.afm +342 -0
- data/data/hexapdf/afm/Courier.afm +342 -0
- data/data/hexapdf/afm/Helvetica-Bold.afm +2827 -0
- data/data/hexapdf/afm/Helvetica-BoldOblique.afm +2827 -0
- data/data/hexapdf/afm/Helvetica-Oblique.afm +3051 -0
- data/data/hexapdf/afm/Helvetica.afm +3051 -0
- data/data/hexapdf/afm/MustRead.html +1 -0
- data/data/hexapdf/afm/Symbol.afm +213 -0
- data/data/hexapdf/afm/Times-Bold.afm +2588 -0
- data/data/hexapdf/afm/Times-BoldItalic.afm +2384 -0
- data/data/hexapdf/afm/Times-Italic.afm +2667 -0
- data/data/hexapdf/afm/Times-Roman.afm +2419 -0
- data/data/hexapdf/afm/ZapfDingbats.afm +225 -0
- data/data/hexapdf/encoding/glyphlist.txt +4305 -0
- data/data/hexapdf/encoding/zapfdingbats.txt +225 -0
- data/examples/arc.rb +50 -0
- data/examples/graphics.rb +274 -0
- data/examples/hello_world.rb +16 -0
- data/examples/machupicchu.jpg +0 -0
- data/examples/merging.rb +24 -0
- data/examples/optimizing.rb +20 -0
- data/examples/show_char_bboxes.rb +55 -0
- data/examples/standard_pdf_fonts.rb +72 -0
- data/examples/truetype.rb +45 -0
- data/lib/hexapdf/cli/extract.rb +128 -0
- data/lib/hexapdf/cli/info.rb +121 -0
- data/lib/hexapdf/cli/inspect.rb +157 -0
- data/lib/hexapdf/cli/modify.rb +218 -0
- data/lib/hexapdf/cli.rb +121 -0
- data/lib/hexapdf/configuration.rb +392 -0
- data/lib/hexapdf/content/canvas.rb +1974 -0
- data/lib/hexapdf/content/color_space.rb +364 -0
- data/lib/hexapdf/content/graphic_object/arc.rb +267 -0
- data/lib/hexapdf/content/graphic_object/endpoint_arc.rb +208 -0
- data/lib/hexapdf/content/graphic_object/solid_arc.rb +173 -0
- data/lib/hexapdf/content/graphic_object.rb +81 -0
- data/lib/hexapdf/content/graphics_state.rb +579 -0
- data/lib/hexapdf/content/operator.rb +1072 -0
- data/lib/hexapdf/content/parser.rb +204 -0
- data/lib/hexapdf/content/processor.rb +451 -0
- data/lib/hexapdf/content/transformation_matrix.rb +172 -0
- data/lib/hexapdf/content.rb +47 -0
- data/lib/hexapdf/data_dir.rb +51 -0
- data/lib/hexapdf/dictionary.rb +303 -0
- data/lib/hexapdf/dictionary_fields.rb +382 -0
- data/lib/hexapdf/document.rb +589 -0
- data/lib/hexapdf/document_utils.rb +209 -0
- data/lib/hexapdf/encryption/aes.rb +206 -0
- data/lib/hexapdf/encryption/arc4.rb +93 -0
- data/lib/hexapdf/encryption/fast_aes.rb +79 -0
- data/lib/hexapdf/encryption/fast_arc4.rb +67 -0
- data/lib/hexapdf/encryption/identity.rb +63 -0
- data/lib/hexapdf/encryption/ruby_aes.rb +447 -0
- data/lib/hexapdf/encryption/ruby_arc4.rb +96 -0
- data/lib/hexapdf/encryption/security_handler.rb +494 -0
- data/lib/hexapdf/encryption/standard_security_handler.rb +616 -0
- data/lib/hexapdf/encryption.rb +94 -0
- data/lib/hexapdf/error.rb +73 -0
- data/lib/hexapdf/filter/ascii85_decode.rb +160 -0
- data/lib/hexapdf/filter/ascii_hex_decode.rb +87 -0
- data/lib/hexapdf/filter/dct_decode.rb +57 -0
- data/lib/hexapdf/filter/encryption.rb +59 -0
- data/lib/hexapdf/filter/flate_decode.rb +93 -0
- data/lib/hexapdf/filter/jpx_decode.rb +56 -0
- data/lib/hexapdf/filter/lzw_decode.rb +191 -0
- data/lib/hexapdf/filter/predictor.rb +266 -0
- data/lib/hexapdf/filter/run_length_decode.rb +108 -0
- data/lib/hexapdf/filter.rb +176 -0
- data/lib/hexapdf/font/cmap/parser.rb +146 -0
- data/lib/hexapdf/font/cmap/writer.rb +176 -0
- data/lib/hexapdf/font/cmap.rb +90 -0
- data/lib/hexapdf/font/encoding/base.rb +77 -0
- data/lib/hexapdf/font/encoding/difference_encoding.rb +64 -0
- data/lib/hexapdf/font/encoding/glyph_list.rb +150 -0
- data/lib/hexapdf/font/encoding/mac_expert_encoding.rb +221 -0
- data/lib/hexapdf/font/encoding/mac_roman_encoding.rb +265 -0
- data/lib/hexapdf/font/encoding/standard_encoding.rb +205 -0
- data/lib/hexapdf/font/encoding/symbol_encoding.rb +244 -0
- data/lib/hexapdf/font/encoding/win_ansi_encoding.rb +280 -0
- data/lib/hexapdf/font/encoding/zapf_dingbats_encoding.rb +250 -0
- data/lib/hexapdf/font/encoding.rb +68 -0
- data/lib/hexapdf/font/true_type/font.rb +179 -0
- data/lib/hexapdf/font/true_type/table/cmap.rb +103 -0
- data/lib/hexapdf/font/true_type/table/cmap_subtable.rb +384 -0
- data/lib/hexapdf/font/true_type/table/directory.rb +92 -0
- data/lib/hexapdf/font/true_type/table/glyf.rb +166 -0
- data/lib/hexapdf/font/true_type/table/head.rb +143 -0
- data/lib/hexapdf/font/true_type/table/hhea.rb +109 -0
- data/lib/hexapdf/font/true_type/table/hmtx.rb +79 -0
- data/lib/hexapdf/font/true_type/table/loca.rb +79 -0
- data/lib/hexapdf/font/true_type/table/maxp.rb +112 -0
- data/lib/hexapdf/font/true_type/table/name.rb +218 -0
- data/lib/hexapdf/font/true_type/table/os2.rb +200 -0
- data/lib/hexapdf/font/true_type/table/post.rb +230 -0
- data/lib/hexapdf/font/true_type/table.rb +155 -0
- data/lib/hexapdf/font/true_type.rb +48 -0
- data/lib/hexapdf/font/true_type_wrapper.rb +240 -0
- data/lib/hexapdf/font/type1/afm_parser.rb +230 -0
- data/lib/hexapdf/font/type1/character_metrics.rb +67 -0
- data/lib/hexapdf/font/type1/font.rb +123 -0
- data/lib/hexapdf/font/type1/font_metrics.rb +117 -0
- data/lib/hexapdf/font/type1/pfb_parser.rb +71 -0
- data/lib/hexapdf/font/type1.rb +52 -0
- data/lib/hexapdf/font/type1_wrapper.rb +193 -0
- data/lib/hexapdf/font_loader/from_configuration.rb +70 -0
- data/lib/hexapdf/font_loader/standard14.rb +98 -0
- data/lib/hexapdf/font_loader.rb +85 -0
- data/lib/hexapdf/font_utils.rb +89 -0
- data/lib/hexapdf/image_loader/jpeg.rb +166 -0
- data/lib/hexapdf/image_loader/pdf.rb +89 -0
- data/lib/hexapdf/image_loader/png.rb +410 -0
- data/lib/hexapdf/image_loader.rb +68 -0
- data/lib/hexapdf/importer.rb +139 -0
- data/lib/hexapdf/name_tree_node.rb +78 -0
- data/lib/hexapdf/number_tree_node.rb +67 -0
- data/lib/hexapdf/object.rb +363 -0
- data/lib/hexapdf/parser.rb +349 -0
- data/lib/hexapdf/rectangle.rb +99 -0
- data/lib/hexapdf/reference.rb +98 -0
- data/lib/hexapdf/revision.rb +206 -0
- data/lib/hexapdf/revisions.rb +194 -0
- data/lib/hexapdf/serializer.rb +326 -0
- data/lib/hexapdf/stream.rb +279 -0
- data/lib/hexapdf/task/dereference.rb +109 -0
- data/lib/hexapdf/task/optimize.rb +230 -0
- data/lib/hexapdf/task.rb +68 -0
- data/lib/hexapdf/tokenizer.rb +406 -0
- data/lib/hexapdf/type/catalog.rb +107 -0
- data/lib/hexapdf/type/embedded_file.rb +87 -0
- data/lib/hexapdf/type/file_specification.rb +232 -0
- data/lib/hexapdf/type/font.rb +81 -0
- data/lib/hexapdf/type/font_descriptor.rb +109 -0
- data/lib/hexapdf/type/font_simple.rb +190 -0
- data/lib/hexapdf/type/font_true_type.rb +47 -0
- data/lib/hexapdf/type/font_type1.rb +162 -0
- data/lib/hexapdf/type/form.rb +103 -0
- data/lib/hexapdf/type/graphics_state_parameter.rb +79 -0
- data/lib/hexapdf/type/image.rb +73 -0
- data/lib/hexapdf/type/info.rb +70 -0
- data/lib/hexapdf/type/names.rb +69 -0
- data/lib/hexapdf/type/object_stream.rb +224 -0
- data/lib/hexapdf/type/page.rb +355 -0
- data/lib/hexapdf/type/page_tree_node.rb +269 -0
- data/lib/hexapdf/type/resources.rb +212 -0
- data/lib/hexapdf/type/trailer.rb +128 -0
- data/lib/hexapdf/type/viewer_preferences.rb +73 -0
- data/lib/hexapdf/type/xref_stream.rb +204 -0
- data/lib/hexapdf/type.rb +67 -0
- data/lib/hexapdf/utils/bit_field.rb +87 -0
- data/lib/hexapdf/utils/bit_stream.rb +148 -0
- data/lib/hexapdf/utils/lru_cache.rb +65 -0
- data/lib/hexapdf/utils/math_helpers.rb +55 -0
- data/lib/hexapdf/utils/object_hash.rb +130 -0
- data/lib/hexapdf/utils/pdf_doc_encoding.rb +93 -0
- data/lib/hexapdf/utils/sorted_tree_node.rb +339 -0
- data/lib/hexapdf/version.rb +39 -0
- data/lib/hexapdf/writer.rb +199 -0
- data/lib/hexapdf/xref_section.rb +152 -0
- data/lib/hexapdf.rb +34 -0
- data/man/man1/hexapdf.1 +249 -0
- data/test/data/aes-test-vectors/CBCGFSbox-128-decrypt.data.gz +0 -0
- data/test/data/aes-test-vectors/CBCGFSbox-128-encrypt.data.gz +0 -0
- data/test/data/aes-test-vectors/CBCGFSbox-192-decrypt.data.gz +0 -0
- data/test/data/aes-test-vectors/CBCGFSbox-192-encrypt.data.gz +0 -0
- data/test/data/aes-test-vectors/CBCGFSbox-256-decrypt.data.gz +0 -0
- data/test/data/aes-test-vectors/CBCGFSbox-256-encrypt.data.gz +0 -0
- data/test/data/aes-test-vectors/CBCKeySbox-128-decrypt.data.gz +0 -0
- data/test/data/aes-test-vectors/CBCKeySbox-128-encrypt.data.gz +0 -0
- data/test/data/aes-test-vectors/CBCKeySbox-192-decrypt.data.gz +0 -0
- data/test/data/aes-test-vectors/CBCKeySbox-192-encrypt.data.gz +0 -0
- data/test/data/aes-test-vectors/CBCKeySbox-256-decrypt.data.gz +0 -0
- data/test/data/aes-test-vectors/CBCKeySbox-256-encrypt.data.gz +0 -0
- data/test/data/aes-test-vectors/CBCVarKey-128-decrypt.data.gz +0 -0
- data/test/data/aes-test-vectors/CBCVarKey-128-encrypt.data.gz +0 -0
- data/test/data/aes-test-vectors/CBCVarKey-192-decrypt.data.gz +0 -0
- data/test/data/aes-test-vectors/CBCVarKey-192-encrypt.data.gz +0 -0
- data/test/data/aes-test-vectors/CBCVarKey-256-decrypt.data.gz +0 -0
- data/test/data/aes-test-vectors/CBCVarKey-256-encrypt.data.gz +0 -0
- data/test/data/aes-test-vectors/CBCVarTxt-128-decrypt.data.gz +0 -0
- data/test/data/aes-test-vectors/CBCVarTxt-128-encrypt.data.gz +0 -0
- data/test/data/aes-test-vectors/CBCVarTxt-192-decrypt.data.gz +0 -0
- data/test/data/aes-test-vectors/CBCVarTxt-192-encrypt.data.gz +0 -0
- data/test/data/aes-test-vectors/CBCVarTxt-256-decrypt.data.gz +0 -0
- data/test/data/aes-test-vectors/CBCVarTxt-256-encrypt.data.gz +0 -0
- data/test/data/fonts/Ubuntu-Title.ttf +0 -0
- data/test/data/images/cmyk.jpg +0 -0
- data/test/data/images/fillbytes.jpg +0 -0
- data/test/data/images/gray.jpg +0 -0
- data/test/data/images/greyscale-1bit.png +0 -0
- data/test/data/images/greyscale-2bit.png +0 -0
- data/test/data/images/greyscale-4bit.png +0 -0
- data/test/data/images/greyscale-8bit.png +0 -0
- data/test/data/images/greyscale-alpha-8bit.png +0 -0
- data/test/data/images/greyscale-trns-8bit.png +0 -0
- data/test/data/images/greyscale-with-gamma1.0.png +0 -0
- data/test/data/images/greyscale-with-gamma1.5.png +0 -0
- data/test/data/images/indexed-1bit.png +0 -0
- data/test/data/images/indexed-2bit.png +0 -0
- data/test/data/images/indexed-4bit.png +0 -0
- data/test/data/images/indexed-8bit.png +0 -0
- data/test/data/images/indexed-alpha-4bit.png +0 -0
- data/test/data/images/indexed-alpha-8bit.png +0 -0
- data/test/data/images/rgb.jpg +0 -0
- data/test/data/images/truecolour-8bit.png +0 -0
- data/test/data/images/truecolour-alpha-8bit.png +0 -0
- data/test/data/images/truecolour-gama-chrm-8bit.png +0 -0
- data/test/data/images/truecolour-srgb-8bit.png +0 -0
- data/test/data/minimal.pdf +44 -0
- data/test/data/standard-security-handler/README +9 -0
- data/test/data/standard-security-handler/bothpwd-aes-128bit-V4.pdf +44 -0
- data/test/data/standard-security-handler/bothpwd-aes-256bit-V5.pdf +0 -0
- data/test/data/standard-security-handler/bothpwd-arc4-128bit-V2.pdf +43 -0
- data/test/data/standard-security-handler/bothpwd-arc4-128bit-V4.pdf +43 -0
- data/test/data/standard-security-handler/bothpwd-arc4-40bit-V1.pdf +0 -0
- data/test/data/standard-security-handler/nopwd-aes-128bit-V4.pdf +43 -0
- data/test/data/standard-security-handler/nopwd-aes-256bit-V5.pdf +0 -0
- data/test/data/standard-security-handler/nopwd-arc4-128bit-V2.pdf +43 -0
- data/test/data/standard-security-handler/nopwd-arc4-128bit-V4.pdf +43 -0
- data/test/data/standard-security-handler/nopwd-arc4-40bit-V1.pdf +43 -0
- data/test/data/standard-security-handler/ownerpwd-aes-128bit-V4.pdf +0 -0
- data/test/data/standard-security-handler/ownerpwd-aes-256bit-V5.pdf +43 -0
- data/test/data/standard-security-handler/ownerpwd-arc4-128bit-V2.pdf +43 -0
- data/test/data/standard-security-handler/ownerpwd-arc4-128bit-V4.pdf +43 -0
- data/test/data/standard-security-handler/ownerpwd-arc4-40bit-V1.pdf +43 -0
- data/test/data/standard-security-handler/userpwd-aes-128bit-V4.pdf +43 -0
- data/test/data/standard-security-handler/userpwd-aes-256bit-V5.pdf +43 -0
- data/test/data/standard-security-handler/userpwd-arc4-128bit-V2.pdf +0 -0
- data/test/data/standard-security-handler/userpwd-arc4-128bit-V4.pdf +0 -0
- data/test/data/standard-security-handler/userpwd-arc4-40bit-V1.pdf +43 -0
- data/test/hexapdf/common_tokenizer_tests.rb +204 -0
- data/test/hexapdf/content/common.rb +31 -0
- data/test/hexapdf/content/graphic_object/test_arc.rb +93 -0
- data/test/hexapdf/content/graphic_object/test_endpoint_arc.rb +91 -0
- data/test/hexapdf/content/graphic_object/test_solid_arc.rb +86 -0
- data/test/hexapdf/content/test_canvas.rb +1113 -0
- data/test/hexapdf/content/test_color_space.rb +97 -0
- data/test/hexapdf/content/test_graphics_state.rb +138 -0
- data/test/hexapdf/content/test_operator.rb +619 -0
- data/test/hexapdf/content/test_parser.rb +66 -0
- data/test/hexapdf/content/test_processor.rb +156 -0
- data/test/hexapdf/content/test_transformation_matrix.rb +64 -0
- data/test/hexapdf/encryption/common.rb +87 -0
- data/test/hexapdf/encryption/test_aes.rb +121 -0
- data/test/hexapdf/encryption/test_arc4.rb +39 -0
- data/test/hexapdf/encryption/test_fast_aes.rb +17 -0
- data/test/hexapdf/encryption/test_fast_arc4.rb +12 -0
- data/test/hexapdf/encryption/test_identity.rb +21 -0
- data/test/hexapdf/encryption/test_ruby_aes.rb +23 -0
- data/test/hexapdf/encryption/test_ruby_arc4.rb +20 -0
- data/test/hexapdf/encryption/test_security_handler.rb +356 -0
- data/test/hexapdf/encryption/test_standard_security_handler.rb +274 -0
- data/test/hexapdf/filter/common.rb +53 -0
- data/test/hexapdf/filter/test_ascii85_decode.rb +60 -0
- data/test/hexapdf/filter/test_ascii_hex_decode.rb +33 -0
- data/test/hexapdf/filter/test_encryption.rb +24 -0
- data/test/hexapdf/filter/test_flate_decode.rb +35 -0
- data/test/hexapdf/filter/test_lzw_decode.rb +52 -0
- data/test/hexapdf/filter/test_predictor.rb +183 -0
- data/test/hexapdf/filter/test_run_length_decode.rb +32 -0
- data/test/hexapdf/font/cmap/test_parser.rb +67 -0
- data/test/hexapdf/font/cmap/test_writer.rb +58 -0
- data/test/hexapdf/font/encoding/test_base.rb +35 -0
- data/test/hexapdf/font/encoding/test_difference_encoding.rb +21 -0
- data/test/hexapdf/font/encoding/test_glyph_list.rb +59 -0
- data/test/hexapdf/font/encoding/test_zapf_dingbats_encoding.rb +16 -0
- data/test/hexapdf/font/test_encoding.rb +27 -0
- data/test/hexapdf/font/test_true_type_wrapper.rb +110 -0
- data/test/hexapdf/font/test_type1_wrapper.rb +66 -0
- data/test/hexapdf/font/true_type/common.rb +19 -0
- data/test/hexapdf/font/true_type/table/test_cmap.rb +59 -0
- data/test/hexapdf/font/true_type/table/test_cmap_subtable.rb +133 -0
- data/test/hexapdf/font/true_type/table/test_directory.rb +35 -0
- data/test/hexapdf/font/true_type/table/test_glyf.rb +58 -0
- data/test/hexapdf/font/true_type/table/test_head.rb +76 -0
- data/test/hexapdf/font/true_type/table/test_hhea.rb +40 -0
- data/test/hexapdf/font/true_type/table/test_hmtx.rb +38 -0
- data/test/hexapdf/font/true_type/table/test_loca.rb +43 -0
- data/test/hexapdf/font/true_type/table/test_maxp.rb +62 -0
- data/test/hexapdf/font/true_type/table/test_name.rb +95 -0
- data/test/hexapdf/font/true_type/table/test_os2.rb +65 -0
- data/test/hexapdf/font/true_type/table/test_post.rb +89 -0
- data/test/hexapdf/font/true_type/test_font.rb +120 -0
- data/test/hexapdf/font/true_type/test_table.rb +41 -0
- data/test/hexapdf/font/type1/test_afm_parser.rb +51 -0
- data/test/hexapdf/font/type1/test_font.rb +68 -0
- data/test/hexapdf/font/type1/test_pfb_parser.rb +37 -0
- data/test/hexapdf/font_loader/test_from_configuration.rb +28 -0
- data/test/hexapdf/font_loader/test_standard14.rb +22 -0
- data/test/hexapdf/image_loader/test_jpeg.rb +83 -0
- data/test/hexapdf/image_loader/test_pdf.rb +47 -0
- data/test/hexapdf/image_loader/test_png.rb +258 -0
- data/test/hexapdf/task/test_dereference.rb +46 -0
- data/test/hexapdf/task/test_optimize.rb +137 -0
- data/test/hexapdf/test_configuration.rb +82 -0
- data/test/hexapdf/test_data_dir.rb +32 -0
- data/test/hexapdf/test_dictionary.rb +284 -0
- data/test/hexapdf/test_dictionary_fields.rb +185 -0
- data/test/hexapdf/test_document.rb +574 -0
- data/test/hexapdf/test_document_utils.rb +144 -0
- data/test/hexapdf/test_filter.rb +96 -0
- data/test/hexapdf/test_font_utils.rb +47 -0
- data/test/hexapdf/test_importer.rb +78 -0
- data/test/hexapdf/test_object.rb +177 -0
- data/test/hexapdf/test_parser.rb +394 -0
- data/test/hexapdf/test_rectangle.rb +36 -0
- data/test/hexapdf/test_reference.rb +41 -0
- data/test/hexapdf/test_revision.rb +139 -0
- data/test/hexapdf/test_revisions.rb +93 -0
- data/test/hexapdf/test_serializer.rb +169 -0
- data/test/hexapdf/test_stream.rb +262 -0
- data/test/hexapdf/test_tokenizer.rb +30 -0
- data/test/hexapdf/test_writer.rb +120 -0
- data/test/hexapdf/test_xref_section.rb +35 -0
- data/test/hexapdf/type/test_catalog.rb +30 -0
- data/test/hexapdf/type/test_embedded_file.rb +16 -0
- data/test/hexapdf/type/test_file_specification.rb +148 -0
- data/test/hexapdf/type/test_font.rb +35 -0
- data/test/hexapdf/type/test_font_descriptor.rb +51 -0
- data/test/hexapdf/type/test_font_simple.rb +190 -0
- data/test/hexapdf/type/test_font_type1.rb +128 -0
- data/test/hexapdf/type/test_form.rb +60 -0
- data/test/hexapdf/type/test_info.rb +14 -0
- data/test/hexapdf/type/test_names.rb +9 -0
- data/test/hexapdf/type/test_object_stream.rb +84 -0
- data/test/hexapdf/type/test_page.rb +260 -0
- data/test/hexapdf/type/test_page_tree_node.rb +255 -0
- data/test/hexapdf/type/test_resources.rb +167 -0
- data/test/hexapdf/type/test_trailer.rb +109 -0
- data/test/hexapdf/type/test_xref_stream.rb +131 -0
- data/test/hexapdf/utils/test_bit_field.rb +47 -0
- data/test/hexapdf/utils/test_lru_cache.rb +22 -0
- data/test/hexapdf/utils/test_object_hash.rb +115 -0
- data/test/hexapdf/utils/test_pdf_doc_encoding.rb +18 -0
- data/test/hexapdf/utils/test_sorted_tree_node.rb +232 -0
- data/test/test_helper.rb +56 -0
- metadata +427 -0
@@ -0,0 +1,382 @@
|
|
1
|
+
# -*- encoding: utf-8 -*-
|
2
|
+
#
|
3
|
+
#--
|
4
|
+
# This file is part of HexaPDF.
|
5
|
+
#
|
6
|
+
# HexaPDF - A Versatile PDF Creation and Manipulation Library For Ruby
|
7
|
+
# Copyright (C) 2016 Thomas Leitner
|
8
|
+
#
|
9
|
+
# HexaPDF is free software: you can redistribute it and/or modify it
|
10
|
+
# under the terms of the GNU Affero General Public License version 3 as
|
11
|
+
# published by the Free Software Foundation with the addition of the
|
12
|
+
# following permission added to Section 15 as permitted in Section 7(a):
|
13
|
+
# FOR ANY PART OF THE COVERED WORK IN WHICH THE COPYRIGHT IS OWNED BY
|
14
|
+
# THOMAS LEITNER, THOMAS LEITNER DISCLAIMS THE WARRANTY OF NON
|
15
|
+
# INFRINGEMENT OF THIRD PARTY RIGHTS.
|
16
|
+
#
|
17
|
+
# HexaPDF is distributed in the hope that it will be useful, but WITHOUT
|
18
|
+
# ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
|
19
|
+
# FITNESS FOR A PARTICULAR PURPOSE. See the GNU Affero General Public
|
20
|
+
# License for more details.
|
21
|
+
#
|
22
|
+
# You should have received a copy of the GNU Affero General Public License
|
23
|
+
# along with HexaPDF. If not, see <http://www.gnu.org/licenses/>.
|
24
|
+
#
|
25
|
+
# The interactive user interfaces in modified source and object code
|
26
|
+
# versions of HexaPDF must display Appropriate Legal Notices, as required
|
27
|
+
# under Section 5 of the GNU Affero General Public License version 3.
|
28
|
+
#
|
29
|
+
# In accordance with Section 7(b) of the GNU Affero General Public
|
30
|
+
# License, a covered work must retain the producer line in every PDF that
|
31
|
+
# is created or manipulated using HexaPDF.
|
32
|
+
#++
|
33
|
+
|
34
|
+
require 'time'
|
35
|
+
require 'date'
|
36
|
+
require 'hexapdf/object'
|
37
|
+
require 'hexapdf/rectangle'
|
38
|
+
require 'hexapdf/configuration'
|
39
|
+
require 'hexapdf/utils/pdf_doc_encoding'
|
40
|
+
|
41
|
+
module HexaPDF
|
42
|
+
|
43
|
+
# A mixin used by Dictionary that implements the infrastructure and classes for defining fields.
|
44
|
+
#
|
45
|
+
# The class responsible for holding the field information is the Field class. Additionally, each
|
46
|
+
# field object is automatically assigned a stateless converter object that knows if data read
|
47
|
+
# from a PDF file potentially needs to be converted into a standard format before use.
|
48
|
+
#
|
49
|
+
# The methods that need to be implemented by such stateless converter objects are:
|
50
|
+
#
|
51
|
+
# usable_for?(type)::
|
52
|
+
# Should return +true+ if the converter is usable for the given type.
|
53
|
+
#
|
54
|
+
# additional_types::
|
55
|
+
# Should return +nil+, a single type class or an array of type classes which will additionally
|
56
|
+
# be allowed for the field.
|
57
|
+
#
|
58
|
+
# convert?(data, type)::
|
59
|
+
# Should return +true+ if the given +data+ object can be converted. The +type+ argument is the
|
60
|
+
# result of the Field#type method call.
|
61
|
+
#
|
62
|
+
# convert(data, type, document)::
|
63
|
+
# Should return the +converted+ data. The +type+ argument is the result of the Field#type method
|
64
|
+
# call and +document+ is the HexaPDF::Document for which the data should be converted.
|
65
|
+
module DictionaryFields
|
66
|
+
|
67
|
+
# This constant should *always* be used for boolean fields.
|
68
|
+
Boolean = [TrueClass, FalseClass]
|
69
|
+
|
70
|
+
# PDFByteString is used for defining fields with strings in binary encoding.
|
71
|
+
PDFByteString = Class.new { private_class_method :new }
|
72
|
+
|
73
|
+
# PDFDate is used for defining fields which store a date object as a string.
|
74
|
+
PDFDate = Class.new { private_class_method :new }
|
75
|
+
|
76
|
+
# A dictionary field contains information about one field of a structured PDF object and this
|
77
|
+
# information comes directly from the PDF specification.
|
78
|
+
#
|
79
|
+
# By incorporating this field information into HexaPDF it is possible to do many things
|
80
|
+
# automatically, like checking for the correct minimum PDF version to use or converting a date
|
81
|
+
# from its string representation to a Time object.
|
82
|
+
class Field
|
83
|
+
|
84
|
+
# Returns the list of available converter objects.
|
85
|
+
#
|
86
|
+
# See ::converter_for for information on how this list is used.
|
87
|
+
def self.converters
|
88
|
+
@converters ||= []
|
89
|
+
end
|
90
|
+
|
91
|
+
# Returns the converter for the given +type+ specification.
|
92
|
+
#
|
93
|
+
# The converter list is checked for a suitable converter from the front to the back. So if
|
94
|
+
# two converters could potentially be used for the same type, the one that appears earlier
|
95
|
+
# is used.
|
96
|
+
def self.converter_for(type)
|
97
|
+
@converters.find {|converter| converter.usable_for?(type)}
|
98
|
+
end
|
99
|
+
|
100
|
+
|
101
|
+
# Returns +true+ if the value for this field needs to be an indirect object, +false+ if it
|
102
|
+
# needs to be a direct object or +nil+ if it can be either.
|
103
|
+
attr_reader :indirect
|
104
|
+
|
105
|
+
# Returns the PDF version that is required for this field.
|
106
|
+
attr_reader :version
|
107
|
+
|
108
|
+
# Create a new Field object. See Dictionary::define_field for information on the arguments.
|
109
|
+
#
|
110
|
+
# Depending on the +type+ entry an appropriate field converter object is chosen from the
|
111
|
+
# available converters.
|
112
|
+
def initialize(type, required = false, default = nil, indirect = nil, version = nil)
|
113
|
+
@type = [type].flatten
|
114
|
+
@type_mapped = false
|
115
|
+
@required, @default, @indirect, @version = required, default, indirect, version
|
116
|
+
@converter = self.class.converter_for(type)
|
117
|
+
end
|
118
|
+
|
119
|
+
# Returns the array with valid types for this field.
|
120
|
+
def type
|
121
|
+
return @type if @type_mapped
|
122
|
+
@type_mapped = true
|
123
|
+
@type.concat(Array(@converter.additional_types))
|
124
|
+
@type.map! do |type|
|
125
|
+
if type.kind_of?(Symbol)
|
126
|
+
HexaPDF::GlobalConfiguration.constantize('object.type_map'.freeze, type)
|
127
|
+
else
|
128
|
+
type
|
129
|
+
end
|
130
|
+
end
|
131
|
+
@type.uniq!
|
132
|
+
@type
|
133
|
+
end
|
134
|
+
|
135
|
+
# Returns +true+ if this field is required.
|
136
|
+
def required?
|
137
|
+
@required
|
138
|
+
end
|
139
|
+
|
140
|
+
# Returns +true+ if a default value is available.
|
141
|
+
def default?
|
142
|
+
!@default.nil?
|
143
|
+
end
|
144
|
+
|
145
|
+
# Returns a duplicated default value, automatically taking unduplicatable classes into
|
146
|
+
# account.
|
147
|
+
def default
|
148
|
+
duplicatable_default? ? @default.dup : @default
|
149
|
+
end
|
150
|
+
|
151
|
+
# Returns +true+ if the default value can safely be duplicated with #dup.
|
152
|
+
def duplicatable_default?
|
153
|
+
@cached_dupdefault ||= HexaPDF::Object::NOT_DUPLICATABLE_CLASSES.none? do |klass|
|
154
|
+
@default.kind_of?(klass)
|
155
|
+
end
|
156
|
+
end
|
157
|
+
private :duplicatable_default?
|
158
|
+
|
159
|
+
# Returns +true+ if the given object is valid for this field.
|
160
|
+
def valid_object?(obj)
|
161
|
+
type.any? {|t| obj.kind_of?(t)} ||
|
162
|
+
(obj.kind_of?(HexaPDF::Object) && type.any? {|t| obj.value.kind_of?(t)})
|
163
|
+
end
|
164
|
+
|
165
|
+
# If a converter was defined, it is used. Otherwise +false+ is returned.
|
166
|
+
#
|
167
|
+
# See: #convert
|
168
|
+
def convert?(data)
|
169
|
+
@converter.convert?(data, type)
|
170
|
+
end
|
171
|
+
|
172
|
+
# If a converter was defined, it is used for converting the data. Otherwise this is a Noop -
|
173
|
+
# it just returns the data.
|
174
|
+
#
|
175
|
+
# See: #convert?
|
176
|
+
def convert(data, document)
|
177
|
+
@converter.convert(data, type, document)
|
178
|
+
end
|
179
|
+
|
180
|
+
end
|
181
|
+
|
182
|
+
# Does nothing.
|
183
|
+
module IdentityConverter
|
184
|
+
|
185
|
+
def self.usable_for?(_type) #:nodoc:
|
186
|
+
true
|
187
|
+
end
|
188
|
+
|
189
|
+
def self.additional_types #:nodoc:
|
190
|
+
end
|
191
|
+
|
192
|
+
def self.convert?(_data, _type) #:nodoc:
|
193
|
+
false
|
194
|
+
end
|
195
|
+
|
196
|
+
def self.convert(data, _type, _document) #:nodoc:
|
197
|
+
data
|
198
|
+
end
|
199
|
+
|
200
|
+
end
|
201
|
+
|
202
|
+
# Converter module for fields of type Dictionary and its subclasses. The first class in the
|
203
|
+
# type array of the field is used for the conversion.
|
204
|
+
module DictionaryConverter
|
205
|
+
|
206
|
+
# This converter is used when either a Symbol is provided as +type+ (for lazy loading) or
|
207
|
+
# when the type is a class derived from the Dictionary class.
|
208
|
+
def self.usable_for?(type)
|
209
|
+
type.kind_of?(Symbol) ||
|
210
|
+
(type.respond_to?(:ancestors) && type.ancestors.include?(HexaPDF::Dictionary))
|
211
|
+
end
|
212
|
+
|
213
|
+
# Dictionary fields can also contain simple hashes.
|
214
|
+
def self.additional_types
|
215
|
+
Hash
|
216
|
+
end
|
217
|
+
|
218
|
+
# Returns +true+ if the given data value can be converted to the Dictionary subclass
|
219
|
+
# specified by type (see Field#type).
|
220
|
+
def self.convert?(data, type)
|
221
|
+
!data.kind_of?(type.first) && (data.kind_of?(Hash) ||
|
222
|
+
data.kind_of?(HexaPDF::Dictionary))
|
223
|
+
end
|
224
|
+
|
225
|
+
# Wraps the given data value in the PDF specific type class.
|
226
|
+
def self.convert(data, type, document)
|
227
|
+
document.wrap(data, type: type.first)
|
228
|
+
end
|
229
|
+
|
230
|
+
end
|
231
|
+
|
232
|
+
# Converter module for string fields to automatically convert a string into UTF-8 encoding.
|
233
|
+
module StringConverter
|
234
|
+
|
235
|
+
# This converter is usable if the +type+ is the String class.
|
236
|
+
def self.usable_for?(type)
|
237
|
+
type == String
|
238
|
+
end
|
239
|
+
|
240
|
+
# :nodoc:
|
241
|
+
def self.additional_types
|
242
|
+
end
|
243
|
+
|
244
|
+
# Returns +true+ if the given data should be converted to a UTF-8 encoded string.
|
245
|
+
def self.convert?(data, _type)
|
246
|
+
data.kind_of?(String) && data.encoding == Encoding::BINARY
|
247
|
+
end
|
248
|
+
|
249
|
+
# Converts the string into UTF-8 encoding, assuming it is currently a binary string.
|
250
|
+
def self.convert(str, _type, _document)
|
251
|
+
if str.getbyte(0) == 254 && str.getbyte(1) == 255
|
252
|
+
str[2..-1].force_encoding(Encoding::UTF_16BE).encode(Encoding::UTF_8)
|
253
|
+
else
|
254
|
+
Utils::PDFDocEncoding.convert_to_utf8(str)
|
255
|
+
end
|
256
|
+
end
|
257
|
+
|
258
|
+
end
|
259
|
+
|
260
|
+
# Converter module for binary string fields to automatically convert a string into binary
|
261
|
+
# encoding.
|
262
|
+
module PDFByteStringConverter
|
263
|
+
|
264
|
+
# This converter is usable if the +type+ is PDFByteString.
|
265
|
+
def self.usable_for?(type)
|
266
|
+
type == PDFByteString
|
267
|
+
end
|
268
|
+
|
269
|
+
# :nodoc:
|
270
|
+
def self.additional_types
|
271
|
+
String
|
272
|
+
end
|
273
|
+
|
274
|
+
# Returns +true+ if the given data should be converted to a UTF-8 encoded string.
|
275
|
+
def self.convert?(data, _type)
|
276
|
+
data.kind_of?(String) && data.encoding != Encoding::BINARY
|
277
|
+
end
|
278
|
+
|
279
|
+
# Converts the string into UTF-8 encoding, assuming it is currently a binary string.
|
280
|
+
def self.convert(str, _type, _document)
|
281
|
+
str.force_encoding(Encoding::BINARY)
|
282
|
+
end
|
283
|
+
|
284
|
+
end
|
285
|
+
|
286
|
+
# Converter module for handling PDF date fields since they are stored as strings.
|
287
|
+
#
|
288
|
+
# The ISO PDF specification differs from Adobe's specification in respect to the supported
|
289
|
+
# date format. When converting from a date string to a Time object, this is taken into
|
290
|
+
# account.
|
291
|
+
#
|
292
|
+
# See: PDF1.7 s7.9.4, ADB1.7 3.8.3
|
293
|
+
module DateConverter
|
294
|
+
|
295
|
+
# This converter is usable if the +type+ is PDFDate.
|
296
|
+
def self.usable_for?(type)
|
297
|
+
type == PDFDate
|
298
|
+
end
|
299
|
+
|
300
|
+
# A date field may contain a string in PDF format, or a Time, Date or DateTime object.
|
301
|
+
def self.additional_types
|
302
|
+
[String, Time, Date, DateTime]
|
303
|
+
end
|
304
|
+
|
305
|
+
# :nodoc:
|
306
|
+
DATE_RE = /\AD:(\d{4})(\d\d)?(\d\d)?(\d\d)?(\d\d)?(\d\d)?([Z+-])?(?:(\d\d)(?:'|'(\d\d)'?|\z)?)?\z/n
|
307
|
+
|
308
|
+
# Returns +true+ if the given data should be converted to a Time object.
|
309
|
+
def self.convert?(data, _type)
|
310
|
+
data.kind_of?(String) && data =~ DATE_RE
|
311
|
+
end
|
312
|
+
|
313
|
+
# Converts the string into a Time object.
|
314
|
+
def self.convert(str, _type, _document)
|
315
|
+
m = DATE_RE.match(str)
|
316
|
+
utc_offset = (m[7].nil? || m[7] == 'Z' ? 0 : "#{m[7]}#{m[8]}:#{m[9] || '00'}")
|
317
|
+
Time.new(m[1].to_i, (m[2] ? m[2].to_i : 1), (m[3] ? m[3].to_i : 1),
|
318
|
+
m[4].to_i, m[5].to_i, m[6].to_i, utc_offset)
|
319
|
+
end
|
320
|
+
|
321
|
+
end
|
322
|
+
|
323
|
+
|
324
|
+
# Converter module for file specification fields. A file specification in string format is
|
325
|
+
# converted to the corresponding file specification dictionary.
|
326
|
+
module FileSpecificationConverter
|
327
|
+
|
328
|
+
# This converter is only used for the :FileSpec type.
|
329
|
+
def self.usable_for?(type)
|
330
|
+
type == :Filespec
|
331
|
+
end
|
332
|
+
|
333
|
+
# FileSpecs can also be simple hashes or strings.
|
334
|
+
def self.additional_types
|
335
|
+
[Hash, String]
|
336
|
+
end
|
337
|
+
|
338
|
+
# Returns +true+ if the given data is a string file specification.
|
339
|
+
def self.convert?(data, _type)
|
340
|
+
data.kind_of?(String)
|
341
|
+
end
|
342
|
+
|
343
|
+
# Converts the string file specification into a full file specification.
|
344
|
+
def self.convert(data, type, document)
|
345
|
+
document.wrap({F: data}, type: type.first)
|
346
|
+
end
|
347
|
+
|
348
|
+
end
|
349
|
+
|
350
|
+
|
351
|
+
# Converter module for fields of type Rectangle.
|
352
|
+
module RectangleConverter
|
353
|
+
|
354
|
+
# This converter is usable if the +type+ is Rectangle.
|
355
|
+
def self.usable_for?(type)
|
356
|
+
type == Rectangle
|
357
|
+
end
|
358
|
+
|
359
|
+
# Rectangle fields can also contain simple arrays.
|
360
|
+
def self.additional_types
|
361
|
+
Array
|
362
|
+
end
|
363
|
+
|
364
|
+
# Returns +true+ if the given data value is an Array.
|
365
|
+
def self.convert?(data, _type)
|
366
|
+
data.kind_of?(Array)
|
367
|
+
end
|
368
|
+
|
369
|
+
# Wraps the given data value in the Rectangle class.
|
370
|
+
def self.convert(data, _type, document)
|
371
|
+
document.wrap(data, type: Rectangle)
|
372
|
+
end
|
373
|
+
|
374
|
+
end
|
375
|
+
|
376
|
+
Field.converters.replace([FileSpecificationConverter, DictionaryConverter, StringConverter,
|
377
|
+
PDFByteStringConverter, DateConverter, RectangleConverter,
|
378
|
+
IdentityConverter])
|
379
|
+
|
380
|
+
end
|
381
|
+
|
382
|
+
end
|