RubyGems - hexapdf - Versions diffs - 0.32.1 → 0.33.0 - Mend

hexapdf 0.32.1 → 0.33.0

Files changed (205) hide show

checksums.yaml +4 -4
data/CHANGELOG.md +76 -1
data/README.md +9 -0
data/examples/002-graphics.rb +15 -17
data/examples/003-arcs.rb +9 -9
data/examples/009-text_layouter_alignment.rb +1 -1
data/examples/010-text_layouter_inline_boxes.rb +2 -2
data/examples/011-text_layouter_line_wrapping.rb +1 -1
data/examples/012-text_layouter_styling.rb +7 -7
data/examples/013-text_layouter_shapes.rb +1 -1
data/examples/014-text_in_polygon.rb +1 -1
data/examples/015-boxes.rb +8 -7
data/examples/016-frame_automatic_box_placement.rb +2 -2
data/examples/017-frame_text_flow.rb +2 -1
data/examples/018-composer.rb +1 -1
data/examples/020-column_box.rb +2 -1
data/examples/025-table_box.rb +46 -0
data/lib/hexapdf/cli/command.rb +5 -2
data/lib/hexapdf/cli/form.rb +5 -5
data/lib/hexapdf/cli/inspect.rb +3 -3
data/lib/hexapdf/cli.rb +4 -0
data/lib/hexapdf/composer.rb +104 -52
data/lib/hexapdf/configuration.rb +44 -39
data/lib/hexapdf/content/canvas.rb +393 -267
data/lib/hexapdf/content/color_space.rb +72 -25
data/lib/hexapdf/content/graphic_object/arc.rb +57 -24
data/lib/hexapdf/content/graphic_object/endpoint_arc.rb +66 -23
data/lib/hexapdf/content/graphic_object/geom2d.rb +47 -6
data/lib/hexapdf/content/graphic_object/solid_arc.rb +58 -36
data/lib/hexapdf/content/graphic_object.rb +6 -7
data/lib/hexapdf/content/graphics_state.rb +54 -45
data/lib/hexapdf/content/operator.rb +52 -54
data/lib/hexapdf/content/parser.rb +2 -2
data/lib/hexapdf/content/processor.rb +15 -15
data/lib/hexapdf/content/transformation_matrix.rb +1 -1
data/lib/hexapdf/content.rb +5 -0
data/lib/hexapdf/dictionary.rb +6 -5
data/lib/hexapdf/dictionary_fields.rb +42 -14
data/lib/hexapdf/digital_signature/cms_handler.rb +2 -2
data/lib/hexapdf/digital_signature/handler.rb +1 -1
data/lib/hexapdf/digital_signature/pkcs1_handler.rb +2 -3
data/lib/hexapdf/digital_signature/signature.rb +6 -6
data/lib/hexapdf/digital_signature/signatures.rb +13 -12
data/lib/hexapdf/digital_signature/signing/default_handler.rb +14 -5
data/lib/hexapdf/digital_signature/signing/signed_data_creator.rb +2 -4
data/lib/hexapdf/digital_signature/signing/timestamp_handler.rb +4 -4
data/lib/hexapdf/digital_signature/signing.rb +4 -0
data/lib/hexapdf/digital_signature/verification_result.rb +2 -2
data/lib/hexapdf/digital_signature.rb +7 -2
data/lib/hexapdf/document/destinations.rb +12 -11
data/lib/hexapdf/document/files.rb +1 -1
data/lib/hexapdf/document/fonts.rb +1 -1
data/lib/hexapdf/document/layout.rb +167 -39
data/lib/hexapdf/document/pages.rb +3 -2
data/lib/hexapdf/document.rb +89 -55
data/lib/hexapdf/encryption/aes.rb +5 -5
data/lib/hexapdf/encryption/arc4.rb +1 -1
data/lib/hexapdf/encryption/fast_aes.rb +2 -2
data/lib/hexapdf/encryption/fast_arc4.rb +1 -1
data/lib/hexapdf/encryption/identity.rb +1 -1
data/lib/hexapdf/encryption/ruby_aes.rb +1 -1
data/lib/hexapdf/encryption/ruby_arc4.rb +1 -1
data/lib/hexapdf/encryption/security_handler.rb +31 -24
data/lib/hexapdf/encryption/standard_security_handler.rb +45 -36
data/lib/hexapdf/encryption.rb +7 -2
data/lib/hexapdf/error.rb +18 -0
data/lib/hexapdf/filter/ascii85_decode.rb +1 -1
data/lib/hexapdf/filter/ascii_hex_decode.rb +1 -1
data/lib/hexapdf/filter/flate_decode.rb +1 -1
data/lib/hexapdf/filter/lzw_decode.rb +1 -1
data/lib/hexapdf/filter/pass_through.rb +1 -1
data/lib/hexapdf/filter/predictor.rb +1 -1
data/lib/hexapdf/filter/run_length_decode.rb +1 -1
data/lib/hexapdf/filter.rb +55 -6
data/lib/hexapdf/font/cmap/parser.rb +2 -2
data/lib/hexapdf/font/cmap.rb +1 -1
data/lib/hexapdf/font/encoding/difference_encoding.rb +1 -1
data/lib/hexapdf/font/encoding/mac_expert_encoding.rb +1 -1
data/lib/hexapdf/font/encoding/mac_roman_encoding.rb +2 -2
data/lib/hexapdf/font/encoding/standard_encoding.rb +1 -1
data/lib/hexapdf/font/encoding/symbol_encoding.rb +1 -1
data/lib/hexapdf/font/encoding/win_ansi_encoding.rb +3 -3
data/lib/hexapdf/font/encoding/zapf_dingbats_encoding.rb +1 -1
data/lib/hexapdf/font/invalid_glyph.rb +3 -0
data/lib/hexapdf/font/true_type_wrapper.rb +17 -4
data/lib/hexapdf/font/type1_wrapper.rb +19 -4
data/lib/hexapdf/font_loader/from_configuration.rb +5 -2
data/lib/hexapdf/font_loader/from_file.rb +5 -5
data/lib/hexapdf/font_loader/standard14.rb +3 -3
data/lib/hexapdf/font_loader.rb +3 -0
data/lib/hexapdf/image_loader/jpeg.rb +2 -2
data/lib/hexapdf/image_loader/pdf.rb +1 -1
data/lib/hexapdf/image_loader/png.rb +2 -2
data/lib/hexapdf/image_loader.rb +1 -1
data/lib/hexapdf/importer.rb +13 -0
data/lib/hexapdf/layout/box.rb +9 -2
data/lib/hexapdf/layout/box_fitter.rb +2 -2
data/lib/hexapdf/layout/column_box.rb +18 -4
data/lib/hexapdf/layout/frame.rb +30 -12
data/lib/hexapdf/layout/image_box.rb +5 -0
data/lib/hexapdf/layout/inline_box.rb +1 -0
data/lib/hexapdf/layout/list_box.rb +17 -1
data/lib/hexapdf/layout/page_style.rb +4 -4
data/lib/hexapdf/layout/style.rb +18 -3
data/lib/hexapdf/layout/table_box.rb +682 -0
data/lib/hexapdf/layout/text_box.rb +5 -3
data/lib/hexapdf/layout/text_fragment.rb +1 -1
data/lib/hexapdf/layout/text_layouter.rb +12 -4
data/lib/hexapdf/layout.rb +1 -0
data/lib/hexapdf/name_tree_node.rb +1 -1
data/lib/hexapdf/number_tree_node.rb +1 -1
data/lib/hexapdf/object.rb +18 -7
data/lib/hexapdf/parser.rb +8 -8
data/lib/hexapdf/pdf_array.rb +1 -1
data/lib/hexapdf/rectangle.rb +1 -1
data/lib/hexapdf/reference.rb +1 -1
data/lib/hexapdf/revision.rb +1 -1
data/lib/hexapdf/revisions.rb +3 -3
data/lib/hexapdf/serializer.rb +15 -15
data/lib/hexapdf/stream.rb +4 -2
data/lib/hexapdf/tokenizer.rb +14 -14
data/lib/hexapdf/type/acro_form/appearance_generator.rb +22 -22
data/lib/hexapdf/type/acro_form/button_field.rb +1 -1
data/lib/hexapdf/type/acro_form/choice_field.rb +1 -1
data/lib/hexapdf/type/acro_form/field.rb +2 -2
data/lib/hexapdf/type/acro_form/form.rb +1 -1
data/lib/hexapdf/type/acro_form/signature_field.rb +4 -4
data/lib/hexapdf/type/acro_form/text_field.rb +1 -1
data/lib/hexapdf/type/acro_form/variable_text_field.rb +1 -1
data/lib/hexapdf/type/acro_form.rb +1 -1
data/lib/hexapdf/type/action.rb +1 -1
data/lib/hexapdf/type/actions/go_to.rb +1 -1
data/lib/hexapdf/type/actions/go_to_r.rb +1 -1
data/lib/hexapdf/type/actions/launch.rb +1 -1
data/lib/hexapdf/type/actions/uri.rb +1 -1
data/lib/hexapdf/type/actions.rb +1 -1
data/lib/hexapdf/type/annotation.rb +3 -3
data/lib/hexapdf/type/annotations/link.rb +1 -1
data/lib/hexapdf/type/annotations/markup_annotation.rb +1 -1
data/lib/hexapdf/type/annotations/text.rb +1 -1
data/lib/hexapdf/type/annotations/widget.rb +2 -2
data/lib/hexapdf/type/annotations.rb +1 -1
data/lib/hexapdf/type/catalog.rb +1 -1
data/lib/hexapdf/type/cid_font.rb +3 -3
data/lib/hexapdf/type/embedded_file.rb +1 -1
data/lib/hexapdf/type/file_specification.rb +2 -2
data/lib/hexapdf/type/font_descriptor.rb +1 -1
data/lib/hexapdf/type/font_simple.rb +2 -2
data/lib/hexapdf/type/font_type0.rb +3 -3
data/lib/hexapdf/type/font_type3.rb +1 -1
data/lib/hexapdf/type/form.rb +1 -1
data/lib/hexapdf/type/graphics_state_parameter.rb +1 -1
data/lib/hexapdf/type/icon_fit.rb +1 -1
data/lib/hexapdf/type/image.rb +1 -1
data/lib/hexapdf/type/info.rb +1 -1
data/lib/hexapdf/type/mark_information.rb +1 -1
data/lib/hexapdf/type/names.rb +2 -2
data/lib/hexapdf/type/object_stream.rb +7 -3
data/lib/hexapdf/type/outline.rb +1 -1
data/lib/hexapdf/type/outline_item.rb +1 -1
data/lib/hexapdf/type/page.rb +19 -10
data/lib/hexapdf/type/page_label.rb +1 -1
data/lib/hexapdf/type/page_tree_node.rb +1 -1
data/lib/hexapdf/type/resources.rb +1 -1
data/lib/hexapdf/type/trailer.rb +2 -2
data/lib/hexapdf/type/viewer_preferences.rb +1 -1
data/lib/hexapdf/type/xref_stream.rb +2 -2
data/lib/hexapdf/utils/pdf_doc_encoding.rb +1 -1
data/lib/hexapdf/version.rb +1 -1
data/lib/hexapdf/writer.rb +4 -4
data/lib/hexapdf/xref_section.rb +2 -2
data/test/hexapdf/content/graphic_object/test_endpoint_arc.rb +11 -1
data/test/hexapdf/content/graphic_object/test_geom2d.rb +7 -0
data/test/hexapdf/content/test_canvas.rb +0 -1
data/test/hexapdf/digital_signature/test_signatures.rb +22 -0
data/test/hexapdf/document/test_files.rb +2 -2
data/test/hexapdf/document/test_layout.rb +98 -0
data/test/hexapdf/encryption/test_security_handler.rb +12 -11
data/test/hexapdf/encryption/test_standard_security_handler.rb +35 -23
data/test/hexapdf/font/test_true_type_wrapper.rb +18 -1
data/test/hexapdf/font/test_type1_wrapper.rb +15 -1
data/test/hexapdf/layout/test_box.rb +1 -1
data/test/hexapdf/layout/test_column_box.rb +65 -21
data/test/hexapdf/layout/test_frame.rb +14 -14
data/test/hexapdf/layout/test_image_box.rb +4 -0
data/test/hexapdf/layout/test_inline_box.rb +5 -0
data/test/hexapdf/layout/test_list_box.rb +40 -6
data/test/hexapdf/layout/test_page_style.rb +3 -2
data/test/hexapdf/layout/test_style.rb +50 -0
data/test/hexapdf/layout/test_table_box.rb +722 -0
data/test/hexapdf/layout/test_text_box.rb +18 -0
data/test/hexapdf/layout/test_text_layouter.rb +4 -0
data/test/hexapdf/test_dictionary_fields.rb +4 -1
data/test/hexapdf/test_document.rb +1 -0
data/test/hexapdf/test_filter.rb +8 -0
data/test/hexapdf/test_importer.rb +9 -0
data/test/hexapdf/test_object.rb +16 -5
data/test/hexapdf/test_parser.rb +1 -1
data/test/hexapdf/test_stream.rb +7 -0
data/test/hexapdf/test_writer.rb +3 -3
data/test/hexapdf/type/acro_form/test_appearance_generator.rb +13 -5
data/test/hexapdf/type/acro_form/test_form.rb +4 -3
data/test/hexapdf/type/test_object_stream.rb +9 -3
data/test/hexapdf/type/test_page.rb +18 -4
metadata +17 -8

data/lib/hexapdf/layout/text_box.rb CHANGED Viewed

@@ -74,13 +74,14 @@ module HexaPDF
         @width = @height = 0
         @result = if style.position == :flow
-                    @tl.fit(@items, frame.width_specification, frame.shape.bbox.height)
+                    @tl.fit(@items, frame.width_specification, frame.shape.bbox.height,
+                            apply_first_text_indent: !split_box?)
                   else
                     @width = reserved_width
                     @height = reserved_height
                     width = (@initial_width > 0 ? @initial_width : available_width) - @width
                     height = (@initial_height > 0 ? @initial_height : available_height) - @height
-                    @tl.fit(@items, width, height)
+                    @tl.fit(@items, width, height, apply_first_text_indent: !split_box?)
                   end
         @width += if @initial_width > 0 || style.align == :center || style.align == :right
                     width
@@ -103,7 +104,8 @@ module HexaPDF
       def split(available_width, available_height, frame)
         fit(available_width, available_height, frame) unless @result
-        if style.position != :flow && (@width > available_width || @height > available_height)
+        if style.position != :flow && (float_compare(@width, available_width) > 0 ||
+                                       float_compare(@height, available_height) > 0)
           [nil, self]
         elsif @result.remaining_items.empty?
           [self]

data/lib/hexapdf/layout/text_fragment.rb CHANGED Viewed

@@ -259,7 +259,7 @@ module HexaPDF
       # The width of the text fragment.
       #
       # It is the sum of the widths of its items and is calculated by using the algorithm presented
-      # in PDF1.7 s9.4.4. By using kerning values as the first and/or last items, the text contained
+      # in PDF2.0 s9.4.4. By using kerning values as the first and/or last items, the text contained
       # in the fragment may spill over the left and/or right boundary.
       def width
         @width ||= @items.sum {|item| style.scaled_item_width(item) }

data/lib/hexapdf/layout/text_layouter.rb CHANGED Viewed

@@ -51,7 +51,8 @@ module HexaPDF
     # * Existing line breaking characters inside of TextFragment objects are respected when fitting
     #   text. If this is not wanted, they have to be removed beforehand.
     #
-    # * The first line may be indented by setting Style#text_indent which may also be negative.
+    # * The first line of each paragraph may be indented by setting Style#text_indent which may also
+    #   be negative.
     #
     # * Text can be fitted into arbitrarily shaped areas, even containing holes.
     #
@@ -658,7 +659,7 @@ module HexaPDF
       end
       # :call-seq:
-      #   text_layouter.fit(items, width, height) -> result
+      #   text_layouter.fit(items, width, height, apply_first_text_indent: true) -> result
       #
       # Fits the items into the given area and returns a Result object with all the information.
       #
@@ -693,7 +694,14 @@ module HexaPDF
       # The text segmentation algorithm specified via #style is applied to the items in case they
       # are not already in segmented form. This also means that Result#remaining_items always
       # contains segmented items.
-      def fit(items, width, height)
+      #
+      # Optional arguments:
+      #
+      # +apply_first_text_indent+::
+      #     Specifies whether style.text_indent should be applied to the first line. This should be
+      #     set to +false+ if the items start with a continuation of a paragraph instead of starting
+      #     a new paragraph (e.g. after a page break).
+      def fit(items, width, height, apply_first_text_indent: true)
         unless items.empty? || items[0].respond_to?(:type)
           items = style.text_segmentation_algorithm.call(items)
         end
@@ -704,7 +712,7 @@ module HexaPDF
         rest = items
         # processing state variables
-        indent = style.text_indent
+        indent = apply_first_text_indent ? style.text_indent : 0
         line_fragments = []
         line_height = 0
         previous_line = nil

data/lib/hexapdf/layout.rb CHANGED Viewed

@@ -57,6 +57,7 @@ module HexaPDF
     autoload(:ColumnBox, 'hexapdf/layout/column_box')
     autoload(:ListBox, 'hexapdf/layout/list_box')
     autoload(:PageStyle, 'hexapdf/layout/page_style')
+    autoload(:TableBox, 'hexapdf/layout/table_box')
   end

data/lib/hexapdf/name_tree_node.rb CHANGED Viewed

@@ -55,7 +55,7 @@ module HexaPDF
   # HexaPDF::Utils::SortedTreeNode) to add or retrieve entries. They ensure that the name tree stays
   # valid.
   #
-  # See: PDF1.7 s7.9.6
+  # See: PDF2.0 s7.9.6
   class NameTreeNode < Dictionary
     include Utils::SortedTreeNode

data/lib/hexapdf/number_tree_node.rb CHANGED Viewed

@@ -44,7 +44,7 @@ module HexaPDF
   # Number trees are similar to name trees but use integers as keys instead of strings. See
   # HexaPDF::NameTreeNode for a more detailed explanation.
   #
-  # See: PDF1.7 s7.9.7, HexaPDF::NameTreeNode
+  # See: PDF2.0 s7.9.7, HexaPDF::NameTreeNode
   class NumberTreeNode < Dictionary
     include Utils::SortedTreeNode

data/lib/hexapdf/object.rb CHANGED Viewed

@@ -117,7 +117,7 @@ module HexaPDF
   #
   # See: HexaPDF::Dictionary, HexaPDF::Stream, HexaPDF::Reference, HexaPDF::Document
   #
-  # See: PDF1.7 s7.3.10, s7.3.8
+  # See: PDF2.0 s7.3.10, s7.3.8
   class Object
     include Comparable
@@ -143,18 +143,27 @@ module HexaPDF
     # Makes sure that the object itself as well as all nested values are direct objects.
     #
+    # The +document+ argument needs to contain the Document instance to which +object+ belongs so
+    # that references can be correctly resolved.
+    #
     # If an indirect object is found, it is turned into a direct object and the indirect object is
     # deleted from the document.
-    def self.make_direct(object)
+    def self.make_direct(object, document)
       if object.kind_of?(HexaPDF::Object) && object.indirect?
+        raise HexaPDF::Error, "Can't make a stream object a direct object" if object.data.stream
         object_to_delete = object
         object = object.value
         object_to_delete.document.delete(object_to_delete)
       end
-      if object.kind_of?(Hash)
-        object.transform_values! {|val| make_direct(val) }
-      elsif object.kind_of?(Array)
-        object.map! {|val| make_direct(val) }
+      case object
+      when HexaPDF::Object
+        object.data.value = make_direct(object.data.value, document)
+      when Hash
+        object.transform_values! {|val| make_direct(val, document) }
+      when Array
+        object.map! {|val| make_direct(val, document) }
+      when Reference
+        object = make_direct(document.object(object), document)
       end
       object
     end
@@ -255,7 +264,7 @@ module HexaPDF
     # type.
     #
     # However, the Type and Subtype fields can easily be used for this. Subclasses for PDF objects
-    # that don't have such fields may use a unique name that has to begin with XX (see PDF1.7 sE.2)
+    # that don't have such fields may use a unique name that has to begin with XX (see PDF2.0 sE.2)
     # and therefore doesn't clash with names defined by the PDF specification.
     #
     # For basic objects this always returns +:Unknown+.
@@ -297,6 +306,8 @@ module HexaPDF
     end
     # Makes a deep copy of the source PDF object and resets the object identifier.
+    #
+    # Note that indirect references are *not* copied! If that is also needed, use Importer::copy.
     def deep_copy
       obj = dup
       obj.instance_variable_set(:@data, @data.dup)

data/lib/hexapdf/parser.rb CHANGED Viewed

@@ -41,11 +41,11 @@ require 'hexapdf/xref_section'
 module HexaPDF
-  # Parses an IO stream according to PDF1.7 to get at the contained objects.
+  # Parses an IO stream according to PDF2.0 to get at the contained objects.
   #
   # This class also contains higher-level methods for getting indirect objects and revisions.
   #
-  # See: PDF1.7 s7
+  # See: PDF2.0 s7
   class Parser
     # The IO stream which is parsed.
@@ -125,7 +125,7 @@ module HexaPDF
     #
     # Returns an array containing [object, oid, gen, stream].
     #
-    # See: PDF1.7 s7.3.10, s7.3.8
+    # See: PDF2.0 s7.3.10, s7.3.8
     def parse_indirect_object(offset = nil)
       @tokenizer.pos = offset + @header_offset if offset
       oid = @tokenizer.next_token
@@ -267,7 +267,7 @@ module HexaPDF
     #
     # This method can only parse cross-reference sections, not cross-reference streams!
     #
-    # See: PDF1.7 s7.5.4, s7.5.5; ADB1.7 sH.3-3.4.3
+    # See: PDF2.0 s7.5.4, s7.5.5; ADB1.7 sH.3-3.4.3
     def parse_xref_section_and_trailer(offset)
       @tokenizer.pos = offset + @header_offset
       token = @tokenizer.next_token
@@ -346,7 +346,7 @@ module HexaPDF
     #
     # If strict parsing is disabled, the whole file is searched for the offset.
     #
-    # See: PDF1.7 s7.5.5, ADB1.7 sH.3-3.4.4
+    # See: PDF2.0 s7.5.5, ADB1.7 sH.3-3.4.4
     def startxref_offset
       return @startxref_offset if defined?(@startxref_offset)
@@ -397,7 +397,7 @@ module HexaPDF
     # Returns the PDF version number that is stored in the file header.
     #
-    # See: PDF1.7 s7.5.2
+    # See: PDF2.0 s7.5.2
     def file_header_version
       unless @header_version
         raise_malformed("PDF file header is missing or corrupt", pos: 0)
@@ -413,7 +413,7 @@ module HexaPDF
     # restriction so that the header may appear in the first 1024 bytes. We follow the Adobe
     # convention.
     #
-    # See: PDF1.7 s7.5.2, ADB1.7 sH.3-3.4.1
+    # See: PDF2.0 s7.5.2, ADB1.7 sH.3-3.4.1
     def retrieve_pdf_header_offset_and_version
       @io.seek(0)
       @header_offset = (@io.read(1024) || '').index(/%PDF-(\d\.\d)/) || 0
@@ -458,7 +458,7 @@ module HexaPDF
               linearized = obj.kind_of?(Hash) && obj.key?(:Linearized)
               @tokenizer.pos = pos
             end
-            @tokenizer.scan_until(/(?:\n|\r\n?)endobj\b/)
+            @tokenizer.scan_until(/\bendobj\b/)
           end
         elsif token.kind_of?(Tokenizer::Token) && token == 'trailer'
           obj = @tokenizer.next_object rescue nil

data/lib/hexapdf/pdf_array.rb CHANGED Viewed

@@ -44,7 +44,7 @@ module HexaPDF
   # #[] method. Therefore not all Array methods are implemented - use the #value directly if other
   # methods are needed.
   #
-  # See: PDF1.7 s7.3.6
+  # See: PDF2.0 s7.3.6
   class PDFArray < HexaPDF::Object
     include Enumerable

data/lib/hexapdf/rectangle.rb CHANGED Viewed

@@ -51,7 +51,7 @@ module HexaPDF
   # where +left+ is the bottom left x-coordinate, +bottom+ is the bottom left y-coordinate, +right+
   # is the top right x-coordinate and +top+ is the top right y-coordinate.
   #
-  # See: PDF1.7 s7.9.5
+  # See: PDF2.0 s7.9.5
   class Rectangle < HexaPDF::PDFArray
     # Returns the x-coordinate of the bottom-left corner.

data/lib/hexapdf/reference.rb CHANGED Viewed

@@ -50,7 +50,7 @@ module HexaPDF
   # keys. Furthermore the implementation is compatible to the one of Object, i.e. the hash of a
   # Reference object is the same as the hash of an indirect Object.
   #
-  # See: PDF1.7 s7.3.10, Object
+  # See: PDF2.0 s7.3.10, Object
   class Reference
     include Comparable

data/lib/hexapdf/revision.rb CHANGED Viewed

@@ -48,7 +48,7 @@ module HexaPDF
   # If a revision doesn't have an associated cross-reference section, it wasn't created from a PDF
   # file.
   #
-  # See: PDF1.7 s7.5.6, Revisions
+  # See: PDF2.0 s7.5.6, Revisions
   class Revision
     include Enumerable

data/lib/hexapdf/revisions.rb CHANGED Viewed

@@ -55,7 +55,7 @@ module HexaPDF
   # this should only be done if one is familiar with the inner workings of HexaPDF. Otherwise it is
   # best to use the convenience methods of this class to create, access or delete indirect objects.
   #
-  # See: PDF1.7 s7.5.6, HexaPDF::Revision
+  # See: PDF2.0 s7.5.6, HexaPDF::Revision
   class Revisions
     class << self
@@ -76,7 +76,7 @@ module HexaPDF
           seen_xref_offsets = {}
           while offset && !seen_xref_offsets.key?(offset)
-            # PDF1.7 s7.5.5 states that :Prev needs to be indirect, Adobe's reference 3.4.4 says it
+            # PDF2.0 s7.5.5 states that :Prev needs to be indirect, Adobe's reference 3.4.4 says it
             # should be direct. Adobe's POV is followed here. Same with :XRefStm.
             xref_section, trailer = parser.load_revision(offset)
             seen_xref_offsets[offset] = true
@@ -167,7 +167,7 @@ module HexaPDF
     # For references to unknown objects, +nil+ is returned but free objects are represented by a
     # PDF Null object, not by +nil+!
     #
-    # See: PDF1.7 s7.3.9
+    # See: PDF2.0 s7.3.9
     def object(ref)
       i = @revisions.size - 1
       while i >= 0

data/lib/hexapdf/serializer.rb CHANGED Viewed

@@ -79,7 +79,7 @@ module HexaPDF
   #
   # If no serialization method for a specific class is found, the ancestors classes are tried.
   #
-  # See: PDF1.7 s7.3
+  # See: PDF2.0 s7.3
   class Serializer
     # The encrypter to use for encrypting strings and streams. If +nil+, strings and streams are not
@@ -163,21 +163,21 @@ module HexaPDF
     # Serializes the +nil+ value.
     #
-    # See: PDF1.7 s7.3.9
+    # See: PDF2.0 s7.3.9
     def serialize_nilclass(_obj)
       "null"
     end
     # Serializes the +true+ value.
     #
-    # See: PDF1.7 s7.3.2
+    # See: PDF2.0 s7.3.2
     def serialize_trueclass(_obj)
       "true"
     end
     # Serializes the +false+ value.
     #
-    # See: PDF1.7 s7.3.2
+    # See: PDF2.0 s7.3.2
     def serialize_falseclass(_obj)
       "false"
     end
@@ -187,21 +187,21 @@ module HexaPDF
     # This method should be used for cases where it is known that the object is either an Integer
     # or a Float.
     #
-    # See: PDF1.7 s7.3.3
+    # See: PDF2.0 s7.3.3
     def serialize_numeric(obj)
       obj.kind_of?(Integer) ? obj.to_s : serialize_float(obj)
     end
     # Serializes an Integer object.
     #
-    # See: PDF1.7 s7.3.3
+    # See: PDF2.0 s7.3.3
     def serialize_integer(obj)
       obj.to_s
     end
     # Serializes a Float object.
     #
-    # See: PDF1.7 s7.3.3
+    # See: PDF2.0 s7.3.3
     def serialize_float(obj)
       if -0.0001 < obj && obj < 0.0001 && obj != 0
         sprintf("%.6f", obj)
@@ -215,7 +215,7 @@ module HexaPDF
     # The regexp matches all characters that need to be escaped and the substs hash contains the
     # mapping from these characters to their escaped form.
     #
-    # See PDF1.7 s7.3.5
+    # See PDF2.0 s7.3.5
     NAME_SUBSTS = {} # :nodoc:
     [0..32, 127..255, Tokenizer::DELIMITER.bytes, Tokenizer::WHITESPACE.bytes, [35]].each do |a|
       a.each {|c| NAME_SUBSTS[c.chr] = "##{c.to_s(16).rjust(2, '0')}" }
@@ -225,7 +225,7 @@ module HexaPDF
     # Serializes a Symbol object (i.e. a PDF name object).
     #
-    # See: PDF1.7 s7.3.5
+    # See: PDF2.0 s7.3.5
     def serialize_symbol(obj)
       NAME_CACHE[obj] ||=
         begin
@@ -240,7 +240,7 @@ module HexaPDF
     # Serializes an Array object.
     #
-    # See: PDF1.7 s7.3.6
+    # See: PDF2.0 s7.3.6
     def serialize_array(obj)
       str = +"["
       index = 0
@@ -256,7 +256,7 @@ module HexaPDF
     # Serializes a Hash object (i.e. a PDF dictionary object).
     #
-    # See: PDF1.7 s7.3.7
+    # See: PDF2.0 s7.3.7
     def serialize_hash(obj)
       str = +"<<"
       obj.each do |k, v|
@@ -274,7 +274,7 @@ module HexaPDF
     # Serializes a String object.
     #
-    # See: PDF1.7 s7.3.4
+    # See: PDF2.0 s7.3.4
     def serialize_string(obj)
       obj = if @encrypter && @object.kind_of?(HexaPDF::Object) && @object.indirect?
               encrypter.encrypt_string(obj, @object)
@@ -294,7 +294,7 @@ module HexaPDF
     # The ISO PDF specification differs in respect to the supported date format. When converting
     # to a date string, a format suitable for both is output.
     #
-    # See: PDF1.7 s7.9.4, ADB1.7 3.8.3
+    # See: PDF2.0 s7.9.4, ADB1.7 3.8.3
     def serialize_time(obj)
       zone = obj.strftime("%z'")
       if zone == "+0000'"
@@ -330,14 +330,14 @@ module HexaPDF
       end
     end
-    # See: PDF1.7 s7.3.10
+    # See: PDF2.0 s7.3.10
     def serialize_hexapdf_reference(obj)
       "#{obj.oid} #{obj.gen} R"
     end
     # Serializes the streams dictionary and its stream.
     #
-    # See: PDF1.7 s7.3.8
+    # See: PDF2.0 s7.3.8
     def serialize_hexapdf_stream(obj)
       if !obj.indirect?
         raise HexaPDF::Error, "Can't serialize PDF stream without object identifier"

data/lib/hexapdf/stream.rb CHANGED Viewed

@@ -88,7 +88,9 @@ module HexaPDF
     # Returns a Fiber for getting at the data of the stream represented by this object.
     def fiber(chunk_size = 0)
-      if @source.kind_of?(Proc)
+      if @source.kind_of?(FiberDoubleForString)
+        @source.dup
+      elsif @source.kind_of?(Proc)
         FiberWithLength.new(@length, &@source)
       elsif @source.kind_of?(String)
         HexaPDF::Filter.source_from_file(@source, pos: @offset || 0, length: @length || -1,
@@ -134,7 +136,7 @@ module HexaPDF
   #
   # Note that support for external streams (/F, /FFilter, /FDecodeParms) is not yet implemented!
   #
-  # See: PDF1.7 s7.3.8, Dictionary
+  # See: PDF2.0 s7.3.8, Dictionary
   class Stream < Dictionary
     define_field :Length,       type: Integer # not required, will be auto-filled when writing

data/lib/hexapdf/tokenizer.rb CHANGED Viewed

@@ -42,7 +42,7 @@ module HexaPDF
   # Tokenizes the content of an IO object following the PDF rules.
   #
-  # See: PDF1.7 s7.2
+  # See: PDF2.0 s7.2
   class Tokenizer
     # Represents a keyword in a PDF file.
@@ -61,12 +61,12 @@ module HexaPDF
     # Characters defined as whitespace.
     #
-    # See: PDF1.7 s7.2.2
+    # See: PDF2.0 s7.2.2
     WHITESPACE = " \n\r\0\t\f"
     # Characters defined as delimiters.
     #
-    # See: PDF1.7 s7.2.2
+    # See: PDF2.0 s7.2.2
     DELIMITER = "()<>{}/[]%"
     WHITESPACE_MULTI_RE = /[#{WHITESPACE}]+/ # :nodoc:
@@ -171,7 +171,7 @@ module HexaPDF
     # If the +allow_end_array_token+ argument is +true+, the ']' token is permitted to facilitate
     # the use of this method during array parsing.
     #
-    # See: PDF1.7 s7.3
+    # See: PDF2.0 s7.3
     def next_object(allow_end_array_token: false, allow_keyword: false)
       token = next_token
@@ -231,7 +231,7 @@ module HexaPDF
     # If a problem is detected, yields to caller where the argument +recoverable+ is truthy if the
     # problem is recoverable.
     #
-    # See: PDF1.7 7.5.4
+    # See: PDF2.0 7.5.4
     def next_xref_entry #:yield: recoverable
       prepare_string_scanner(20)
       if !@ss.skip(/(\d{10}) (\d{5}) ([nf])(?: \r| \n|\r\n|(\r\r|\r|\n))/) || @ss[4]
@@ -242,7 +242,7 @@ module HexaPDF
     # Skips all whitespace at the current position.
     #
-    # See: PDF1.7 s7.2.2
+    # See: PDF2.0 s7.2.2
     def skip_whitespace
       prepare_string_scanner
       prepare_string_scanner while @ss.skip(WHITESPACE_MULTI_RE)
@@ -268,7 +268,7 @@ module HexaPDF
     # Parses the keyword at the current position.
     #
-    # See: PDF1.7 s7.2
+    # See: PDF2.0 s7.2
     def parse_keyword
       str = scan_until(WHITESPACE_OR_DELIMITER_RE) || @ss.scan(/.*/)
       TOKEN_CACHE[str]
@@ -278,12 +278,12 @@ module HexaPDF
     # Parses the number (integer or real) at the current position.
     #
-    # See: PDF1.7 s7.3.3
+    # See: PDF2.0 s7.3.3
     def parse_number
       val = scan_until(WHITESPACE_OR_DELIMITER_RE) || @ss.scan(/.*/)
       if val.match?(/\A[+-]?\d++(?!\.)\z/)
         tmp = val.to_i
-        # Handle object references, see PDF1.7 s7.3.10
+        # Handle object references, see PDF2.0 s7.3.10
         prepare_string_scanner(10)
         if @ss.scan(REFERENCE_RE)
           tmp = if tmp > 0
@@ -315,7 +315,7 @@ module HexaPDF
     # Parses the literal string at the current position.
     #
-    # See: PDF1.7 s7.3.4.2
+    # See: PDF2.0 s7.3.4.2
     def parse_literal_string
       @ss.pos += 1
       str = "".b
@@ -358,7 +358,7 @@ module HexaPDF
     # Parses the hex string at the current position.
     #
-    # See: PDF1.7 s7.3.4.3
+    # See: PDF2.0 s7.3.4.3
     def parse_hex_string
       @ss.pos += 1
       data = scan_until(/(?=>)/)
@@ -373,7 +373,7 @@ module HexaPDF
     # Parses the name at the current position.
     #
-    # See: PDF1.7 s7.3.5
+    # See: PDF2.0 s7.3.5
     def parse_name
       @ss.pos += 1
       str = scan_until(WHITESPACE_OR_DELIMITER_RE) || @ss.scan(/.*/)
@@ -389,7 +389,7 @@ module HexaPDF
     #
     # It is assumed that the initial '[' has already been scanned.
     #
-    # See: PDF1.7 s7.3.6
+    # See: PDF2.0 s7.3.6
     def parse_array
       result = []
       while true
@@ -408,7 +408,7 @@ module HexaPDF
     #
     # It is assumed that the initial '<<' has already been scanned.
     #
-    # See: PDF1.7 s7.3.7
+    # See: PDF2.0 s7.3.7
     def parse_dictionary
       result = {}
       while true

data/lib/hexapdf/type/acro_form/appearance_generator.rb CHANGED Viewed

@@ -61,7 +61,7 @@ module HexaPDF
       # By subclassing and overriding the necessary methods it is possible to define custom
       # appearances.
       #
-      # See: PDF1.7 s12.5.5, s12.7
+      # See: PDF2.0 s12.5.5, s12.7
       class AppearanceGenerator
         # Creates a new instance for the given +widget+.
@@ -200,7 +200,7 @@ module HexaPDF
         def create_text_appearances
           default_resources = @document.acro_form.default_resources
           font, font_size, font_color = retrieve_font_information(default_resources)
-          style = HexaPDF::Layout::Style.new(font: font, fill_color: font_color)
+          style = HexaPDF::Layout::Style.new(font: font, font_size: font_size, fill_color: font_color)
           border_style = @widget.border_style
           padding = [1, border_style.width].max
@@ -226,8 +226,6 @@ module HexaPDF
           canvas = form.canvas
           apply_background_and_border(border_style, canvas)
-          style.font_size = calculate_font_size(font, font_size, height, border_style)
-          style.clear_cache
           canvas.marked_content_sequence(:Tx) do
             if @field.field_value || @field.concrete_field_type == :list_box
@@ -362,6 +360,7 @@ module HexaPDF
         def draw_single_line_text(canvas, width, height, style, padding)
           value, text_color = apply_javascript_formatting(@field.field_value)
           style.fill_color = text_color if text_color
+          calculate_and_apply_font_size(value, style, width, height, padding)
           fragment = HexaPDF::Layout::TextFragment.create(value, style)
           if @field.concrete_field_type == :comb_text_field
@@ -431,6 +430,11 @@ module HexaPDF
         # Draws the visible option items of the list box in the widget's rectangle.
         def draw_list_box(canvas, width, height, style, padding)
+          if style.font_size == 0
+            style.font_size = 12 # Seems to be Adobe's default
+            style.clear_cache
+          end
           option_items = @field.option_items
           top_index = @field.list_box_top_index
           items = [Layout::TextFragment.create(option_items[top_index..-1].join("\n"), style)]
@@ -475,24 +479,20 @@ module HexaPDF
           [font, font_size, font_color]
         end
-        # Calculates the font size for text fields based on the font and font size of the default
-        # appearance string, the annotation rectangle's height and the border style.
-        def calculate_font_size(font, font_size, height, border_style)
-          if font_size == 0
-            case @field.concrete_field_type
-            when :multiline_text_field
-              0 # Handled by multiline drawing code
-            when :list_box
-              12 # Seems to be Adobe's default
-            else
-              unit_font_size = (font.wrapped_font.bounding_box[3] - font.wrapped_font.bounding_box[1]) *
-                font.scaling_factor / 1000.0
-              # The constant factor was found empirically by checking what Adobe Reader etc. do
-              (height - 2 * border_style.width) / unit_font_size * 0.83
-            end
-          else
-            font_size
-          end
+        # Calculates the font size for single line text fields using auto-sizing, based on the font
+        # and font size of the default appearance string, the annotation rectangle's height and
+        # width and the given padding. The font size is then applied to the provided style object.
+        def calculate_and_apply_font_size(value, style, width, height, padding)
+          return if style.font_size != 0
+          font = style.font
+          unit_font_size = (font.wrapped_font.bounding_box[3] - font.wrapped_font.bounding_box[1]) *
+            font.scaling_factor / 1000.0
+          # The constant factor was found empirically by checking what Adobe Reader etc. do
+          style.font_size = (height - 2 * padding) / unit_font_size * 0.85
+          fragment = HexaPDF::Layout::TextFragment.create(value, style)
+          style.font_size = [style.font_size, style.font_size * (width - 4 * padding) / fragment.width].min
+          style.clear_cache
         end
         # Handles Javascript formatting routines for single-line text fields.

data/lib/hexapdf/type/acro_form/button_field.rb CHANGED Viewed

@@ -81,7 +81,7 @@ module HexaPDF
       # :radios_in_unison:: A group of radio buttons with the same value for the on state will turn
       #                     on or off in unison.
       #
-      # See: PDF1.7 s12.7.4.2
+      # See: PDF2.0 s12.7.4.2
       class ButtonField < Field
         define_type :XXAcroFormField