RubyGems - pdf-reader - Versions diffs - 1.1.1 → 1.2.0 - Mend

pdf-reader 1.1.1 → 1.2.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (24)

data/CHANGELOG +8 -0
data/bin/pdf_text +0 -2
data/examples/extract_images.rb +11 -6
data/lib/pdf/reader.rb +11 -5
data/lib/pdf/reader/buffer.rb +48 -42
data/lib/pdf/reader/cmap.rb +26 -11
data/lib/pdf/reader/filter.rb +11 -234
data/lib/pdf/reader/filter/ascii85.rb +25 -0
data/lib/pdf/reader/filter/ascii_hex.rb +26 -0
data/lib/pdf/reader/filter/depredict.rb +138 -0
data/lib/pdf/reader/filter/flate.rb +38 -0
data/lib/pdf/reader/filter/lzw.rb +18 -0
data/lib/pdf/reader/filter/null.rb +15 -0
data/lib/pdf/reader/filter/run_length.rb +46 -0
data/lib/pdf/reader/font.rb +1 -1
data/lib/pdf/reader/form_xobject.rb +25 -4
data/lib/pdf/reader/glyph_hash.rb +3 -2
data/lib/pdf/reader/object_cache.rb +39 -16
data/lib/pdf/reader/object_hash.rb +1 -1
data/lib/pdf/reader/page.rb +7 -1
data/lib/pdf/reader/page_state.rb +2 -1
data/lib/pdf/reader/stream.rb +1 -1
data/lib/pdf/reader/xref.rb +23 -4
metadata +99 -46

data/CHANGELOG CHANGED

@@ -1,3 +1,11 @@
+v1.2.0 (28th August 2012)
+- Feature: correctly extract text using surrogate pairs and ligatures
+  (thanks Nathaniel Madura)
+- Speed optimisation: cache tokenised Form XObjects to avoid re-parsing them
+- Feature: support opening documents with some junk bytes prepended to file
+  (thanks Paul Gallagher)
+  - Acrobat does this, so it seemed reasonable to add support
 v1.1.1 (9th May 2012)
 - bugfix release to improve parsing of some PDFs

data/bin/pdf_text CHANGED

@@ -1,8 +1,6 @@
 #!/usr/bin/env ruby
 require 'rubygems'
-$LOAD_PATH.unshift(File.dirname(__FILE__) + "/../lib")
 require 'pdf/reader'
 if ARGV.empty?

data/examples/extract_images.rb CHANGED

@@ -86,14 +86,15 @@ module ExtractImages
       tiff = header.dup
       tiff << short_tag.call( 256, 1, w ) # image width
       tiff << short_tag.call( 257, 1, h ) # image height
-      tiff << long_tag.call( 258, 4, (header.size + (tag_count*12))) # bits per pixel
+      tiff << long_tag.call( 258, 4, (header.size + (tag_count*12) + 4)) # bits per pixel
       tiff << short_tag.call( 259, 1, 1 ) # compression
       tiff << short_tag.call( 262, 1, 5 ) # colorspace - separation
-      tiff << long_tag.call( 273, 1, (10 + (tag_count*12) + 16) ) # data offset
+      tiff << long_tag.call( 273, 1, (10 + (tag_count*12) + 20) ) # data offset
       tiff << short_tag.call( 277, 1, 4 ) # samples per pixel
       tiff << long_tag.call( 279, 1, stream.unfiltered_data.size) # data byte size
       tiff << short_tag.call( 284, 1, 1 ) # planer config
       tiff << long_tag.call( 332, 1, 1)   # inkset - CMYK
+      tiff << [0].pack("I") # next IFD pointer
       tiff << [bpc, bpc, bpc, bpc].pack("IIII")
       tiff << stream.unfiltered_data
       File.open(filename, "wb") { |file| file.write tiff }
@@ -119,10 +120,12 @@ module ExtractImages
       tiff << short_tag.call( 258, 1, 8 ) # bits per pixel
       tiff << short_tag.call( 259, 1, 1 ) # compression
       tiff << short_tag.call( 262, 1, 1 ) # colorspace - grayscale
-      tiff << long_tag.call( 273, 1, (10 + (tag_count*12)) ) # data offset
+      tiff << long_tag.call( 273, 1, (10 + (tag_count*12) + 4) ) # data offset
       tiff << short_tag.call( 277, 1, 1 ) # samples per pixel
       tiff << long_tag.call( 279, 1, stream.unfiltered_data.size) # data byte size
       tiff << short_tag.call( 284, 1, 1 ) # planer config
+      tiff << [0].pack("I") # next IFD pointer
+      p stream.unfiltered_data.size
       tiff << stream.unfiltered_data
       File.open(filename, "wb") { |file| file.write tiff }
     end
@@ -144,12 +147,13 @@ module ExtractImages
       tiff = header.dup
       tiff << short_tag.call( 256, 1, w ) # image width
       tiff << short_tag.call( 257, 1, h ) # image height
-      tiff << long_tag.call( 258, 3, (header.size + (tag_count*12))) # bits per pixel
+      tiff << long_tag.call( 258, 3, (header.size + (tag_count*12) + 4)) # bits per pixel
       tiff << short_tag.call( 259, 1, 1 ) # compression
       tiff << short_tag.call( 262, 1, 2 ) # colorspace - RGB
-      tiff << long_tag.call( 273, 1, (header.size + (tag_count*12) + 12) ) # data offset
+      tiff << long_tag.call( 273, 1, (header.size + (tag_count*12) + 16) ) # data offset
       tiff << short_tag.call( 277, 1, 3 ) # samples per pixel
       tiff << long_tag.call( 279, 1, stream.unfiltered_data.size) # data byte size
+      tiff << [0].pack("I") # next IFD pointer
       tiff << [bpc, bpc, bpc].pack("III")
       tiff << stream.unfiltered_data
       File.open(filename, "wb") { |file| file.write tiff }
@@ -209,8 +213,9 @@ module ExtractImages
       + short_tag.call( 256, cols ) \
       + short_tag.call( 257, h ) \
       + short_tag.call( 259, 4 ) \
-      + long_tag.call( 273, (10 + (5*12)) ) \
+      + long_tag.call( 273, (10 + (5*12) + 4) ) \
       + long_tag.call( 279, len) \
+      + [0].pack("I") \
       + stream.data
       File.open(filename, "wb") { |file| file.write tiff }
     end

data/lib/pdf/reader.rb CHANGED

@@ -25,9 +25,6 @@
 ################################################################################
 require 'stringio'
-require 'zlib'
-require 'ascii85'
 module PDF
   ################################################################################
@@ -113,6 +110,8 @@ module PDF
     #
     def initialize(input = nil, opts = {})
       if input # support the deprecated Reader API
+        @cache   = PDF::Reader::ObjectCache.new
+        opts.merge!(:cache => @cache)
         @objects = PDF::Reader::ObjectHash.new(input, opts)
       end
     end
@@ -222,7 +221,7 @@ module PDF
     #
     def pages
       (1..self.page_count).map { |num|
-        PDF::Reader::Page.new(@objects, num)
+        PDF::Reader::Page.new(@objects, num, :cache => @cache)
       }
     end
@@ -241,7 +240,7 @@ module PDF
     def page(num)
       num = num.to_i
       raise ArgumentError, "valid pages are 1 .. #{self.page_count}" if num < 1 || num > self.page_count
-      PDF::Reader::Page.new(@objects, num)
+      PDF::Reader::Page.new(@objects, num, :cache => @cache)
     end
@@ -338,6 +337,13 @@ require 'pdf/reader/cmap'
 require 'pdf/reader/encoding'
 require 'pdf/reader/error'
 require 'pdf/reader/filter'
+require 'pdf/reader/filter/ascii85'
+require 'pdf/reader/filter/ascii_hex'
+require 'pdf/reader/filter/depredict'
+require 'pdf/reader/filter/flate'
+require 'pdf/reader/filter/lzw'
+require 'pdf/reader/filter/null'
+require 'pdf/reader/filter/run_length'
 require 'pdf/reader/font'
 require 'pdf/reader/form_xobject'
 require 'pdf/reader/glyph_hash'

data/lib/pdf/reader/buffer.rb CHANGED

@@ -36,7 +36,7 @@ class PDF::Reader
   # the raw tokens into objects we can work with (strings, ints, arrays, etc)
   #
   class Buffer
-    TOKEN_WHITESPACE=["\x00", "\x09", "\x0A", "\x0C", "\x0D", "\x20"]
+    TOKEN_WHITESPACE=[0x00, 0x09, 0x0A, 0x0C, 0x0D, 0x20]
     attr_reader :pos
@@ -232,18 +232,17 @@ class PDF::Reader
       finished = false
       while !finished
-        chr = @io.read(1)
-        codepoint = chr.to_s.unpack("C*").first
-        if chr.nil?
+        byte = @io.getbyte
+        if byte.nil?
           finished = true # unbalanced params
-        elsif (48..57).include?(codepoint) || (65..90).include?(codepoint) || (97..122).include?(codepoint)
-          str << chr
-        elsif codepoint <= 32
+        elsif (48..57).include?(byte) || (65..90).include?(byte) || (97..122).include?(byte)
+          str << byte.chr
+        elsif byte <= 32
           # ignore it
         else
           @tokens << str if str.size > 0
-          @tokens << ">" if chr != ">"
-          @tokens << chr
+          @tokens << ">" if byte != 0x3E # '>'
+          @tokens << byte.chr
           finished = true
         end
       end
@@ -263,19 +262,19 @@ class PDF::Reader
       count = 1
       while count > 0
-        chr = @io.read(1)
-        if chr.nil?
+        byte = @io.getbyte
+        if byte.nil?
           count = 0 # unbalanced params
-        elsif chr == "\x5c"
-          str << chr << @io.read(1).to_s
-        elsif chr == "("
+        elsif byte == 0x5C
+          str << byte.chr << @io.getbyte.chr
+        elsif byte == 0x28 # "("
           str << "("
           count += 1
-        elsif chr == ")"
+        elsif byte == 0x29 # ")"
           count -= 1
           str << ")" unless count == 0
         else
-          str << chr unless count == 0
+          str << byte.chr unless count == 0
         end
       end
@@ -291,61 +290,68 @@ class PDF::Reader
     def prepare_regular_token
       tok = ""
-      while chr = @io.read(1)
-        case chr
-        when "\x25"
+      while byte = @io.getbyte
+        case byte
+        when 0x25
           # comment, ignore everything until the next EOL char
           done = false
           while !done
-            chr = @io.read(1)
-            done = true if chr.nil? || chr == "\x0A" || chr == "\x0D"
+            byte = @io.getbyte
+            done = true if byte.nil? || byte == 0x0A || byte == 0x0D
           end
         when *TOKEN_WHITESPACE
           # white space, token finished
           @tokens << tok if tok.size > 0
           #If the token was empty, chomp the rest of the whitespace too
-          while TOKEN_WHITESPACE.include?(peek_char) && tok.size == 0
-            @io.read(1)
+          while TOKEN_WHITESPACE.include?(peek_byte) && tok.size == 0
+            @io.getbyte
           end
           tok = ""
           break
-        when "\x3C"
+        when 0x3C
           # opening delimiter '<', start of new token
           @tokens << tok if tok.size > 0
-          chr << @io.read(1) if peek_char == "\x3C" # check if token is actually '<<'
-          @tokens << chr
+          if peek_byte == 0x3C # check if token is actually '<<'
+            @io.getbyte
+            @tokens << "<<"
+          else
+            @tokens << "<"
+          end
           tok = ""
           break
-        when "\x3E"
+        when 0x3E
           # closing delimiter '>', start of new token
           @tokens << tok if tok.size > 0
-          chr << @io.read(1) if peek_char == "\x3E" # check if token is actually '>>'
-          @tokens << chr
+          if peek_byte == 0x3E # check if token is actually '>>'
+            @io.getbyte
+            @tokens << ">>"
+          else
+            @tokens << byte.chr
+          end
           tok = ""
           break
-        when "\x28", "\x5B", "\x7B"
+        when 0x28, 0x5B, 0x7B
           # opening delimiter, start of new token
           @tokens << tok if tok.size > 0
-          @tokens << chr
+          @tokens << byte.chr
           tok = ""
           break
-        when "\x29", "\x5D", "\x7D"
+        when 0x29, 0x5D, 0x7D
           # closing delimiter
           @tokens << tok if tok.size > 0
-          @tokens << chr
+          @tokens << byte.chr
           tok = ""
           break
-        when "\x2F"
+        when 0x2F
           # PDF name, start of new token
           @tokens << tok if tok.size > 0
-          @tokens << chr
-          next_char = peek_char
-          @tokens << "" if chr == "/" && [nil, " ", "\n"].include?(next_char)
+          @tokens << byte.chr
+          @tokens << "" if byte == 0x2F && [nil, 0x20, 0x0A].include?(peek_byte)
           tok = ""
           break
         else
-          tok << chr
+          tok << byte.chr
         end
       end
@@ -355,10 +361,10 @@ class PDF::Reader
     # peek at the next character in the io stream, leaving the stream position
     # untouched
     #
-    def peek_char
-      chr = @io.read(1)
-      @io.seek(-1, IO::SEEK_CUR) unless chr.nil?
-      chr
+    def peek_byte
+      byte = @io.getbyte
+      @io.seek(-1, IO::SEEK_CUR) if byte
+      byte
     end
     # for a handful of tokens we want to tell the parser how to convert them

data/lib/pdf/reader/cmap.rb CHANGED

@@ -60,6 +60,10 @@ class PDF::Reader
       @map.size
     end
+    # Convert a glyph code into one or more Codepoints.
+    #
+    # Returns an array of Fixnums.
+    #
     def decode(c)
       # TODO: implement the conversion
       return c unless c.class == Fixnum
@@ -74,12 +78,23 @@ class PDF::Reader
     end
     def str_to_int(str)
-      return nil if str.nil? || str.size == 0 || str.size >= 3
-      if str.size == 1
-        str.unpack("C*")[0]
+      return nil if str.nil? || str.size == 0
+      unpacked_string = if str.size == 1 # UTF-8
+        str.unpack("C*")
+      else # UTF-16
+         str.unpack("n*")
+      end
+      if unpacked_string.length == 1
+        unpacked_string
+      elsif unpacked_string.length == 2 && (unpacked_string[0] > 0xD800 && unpacked_string[0] < 0xDBFF)
+        # this is a Unicode UTF-16 "Surrogate Pair" see Unicode Spec. Chapter 3.7
+        # lets convert to a UTF-32. (the high bit is between 0xD800-0xDBFF, the
+        # low bit is between 0xDC00-0xDFFF) for example: U+1D44E (U+D835 U+DC4E)
+        [(unpacked_string[0] - 0xD800) * 0x400 + (unpacked_string[1] - 0xDC00) + 0x10000]
       else
-        str.unpack("n*")[0]
+        # it is a bad idea to just return the first 16 bits, as this doesn't allow
+        # for ligatures for example fi (U+0066 U+0069)
+        unpacked_string
       end
     end
@@ -88,7 +103,7 @@ class PDF::Reader
       find    = str_to_int(parser.parse_token)
       replace = str_to_int(parser.parse_token)
       while find && replace
-        @map[find] = replace
+        @map[find[0]] = replace
         find       = str_to_int(parser.parse_token)
         replace    = str_to_int(parser.parse_token)
       end
@@ -114,21 +129,21 @@ class PDF::Reader
     end
     def bfrange_type_one(start_code, end_code, dst)
-      start_code = str_to_int(start_code)
-      end_code   = str_to_int(end_code)
+      start_code = str_to_int(start_code)[0]
+      end_code   = str_to_int(end_code)[0]
       dst        = str_to_int(dst)
       # add all values in the range to our mapping
       (start_code..end_code).each_with_index do |val, idx|
-        @map[val] = dst + idx
+        @map[val] = dst.length == 1 ? [dst[0] + idx] : [dst[0], dst[1] + 1]
         # ensure a single range does not exceed 255 chars
         raise PDF::Reader::MalformedPDFError, "a CMap bfrange cann't exceed 255 chars" if idx > 255
       end
     end
     def bfrange_type_two(start_code, end_code, dst)
-      start_code = str_to_int(start_code)
-      end_code   = str_to_int(end_code)
+      start_code = str_to_int(start_code)[0]
+      end_code   = str_to_int(end_code)[0]
       from_range = (start_code..end_code)
       # add all values in the range to our mapping

data/lib/pdf/reader/filter.rb CHANGED

@@ -22,7 +22,6 @@
 # WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
 #
 ################################################################################
-require 'zlib'
 class PDF::Reader
   ################################################################################
@@ -30,7 +29,7 @@ class PDF::Reader
   # support for features like compression and encryption. This class is for decoding that
   # content.
   #
-  class Filter # :nodoc:
+  module Filter # :nodoc:
     ################################################################################
     # creates a new filter for decoding content.
@@ -38,242 +37,20 @@ class PDF::Reader
     # Filters that are only used to encode image data are accepted, but the data is
     # returned untouched. At this stage PDF::Reader has no need to decode images.
     #
-    def initialize (name, options = nil)
-      @options = options
+    def self.with(name, options = {})
       case name.to_sym
-      when :ASCII85Decode   then @filter = :ascii85
-      when :ASCIIHexDecode  then @filter = :asciihex
-      when :CCITTFaxDecode  then @filter = nil
-      when :DCTDecode       then @filter = nil
-      when :FlateDecode     then @filter = :flate
-      when :JBIG2Decode     then @filter = nil
-      when :JPXDecode       then @filter = nil
-      when :LZWDecode       then @filter = :lzw
-      when :RunLengthDecode then @filter = :runlength
+      when :ASCII85Decode   then PDF::Reader::Filter::Ascii85.new(options)
+      when :ASCIIHexDecode  then PDF::Reader::Filter::AsciiHex.new(options)
+      when :CCITTFaxDecode  then PDF::Reader::Filter::Null.new(options)
+      when :DCTDecode       then PDF::Reader::Filter::Null.new(options)
+      when :FlateDecode     then PDF::Reader::Filter::Flate.new(options)
+      when :JBIG2Decode     then PDF::Reader::Filter::Null.new(options)
+      when :JPXDecode       then PDF::Reader::Filter::Null.new(options)
+      when :LZWDecode       then PDF::Reader::Filter::Lzw.new(options)
+      when :RunLengthDecode then PDF::Reader::Filter::RunLength.new(options)
       else
         raise UnsupportedFeatureError, "Unknown filter: #{name}"
       end
     end
-    ################################################################################
-    # attempts to decode the specified data with the current filter
-    #
-    # Filters that are only used to encode image data are accepted, but the data is
-    # returned untouched. At this stage PDF::Reader has no need to decode images.
-    #
-    def filter (data)
-      # leave the data untouched if we don't support the required filter
-      return data if @filter.nil?
-      # decode the data
-      self.send(@filter, data)
-    end
-    ################################################################################
-    # Decode the specified data using the Ascii85 algorithm. Relies on the AScii85
-    # rubygem.
-    #
-    def ascii85(data)
-      data = "<~#{data}" unless data.to_s[0,2] == "<~"
-      Ascii85::decode(data)
-    rescue Exception => e
-      # Oops, there was a problem decoding the stream
-      raise MalformedPDFError, "Error occured while decoding an ASCII85 stream (#{e.class.to_s}: #{e.to_s})"
-    end
-    ################################################################################
-    # Decode the specified data using the AsciiHex algorithm.
-    #
-    def asciihex(data)
-      data.chop! if data[-1,1] == ">"
-      data = data[1,data.size] if data[0,1] == "<"
-      data.gsub!(/[^A-Fa-f0-9]/,"")
-      data << "0" if data.size % 2 == 1
-      data.scan(/.{2}/).map { |s| s.hex.chr }.join("")
-    rescue Exception => e
-      # Oops, there was a problem decoding the stream
-      raise MalformedPDFError, "Error occured while decoding an ASCIIHex stream (#{e.class.to_s}: #{e.to_s})"
-    end
-    ################################################################################
-    # Decode the specified data with the Zlib compression algorithm
-    def flate (data)
-      deflated = nil
-      begin
-        deflated = Zlib::Inflate.new.inflate(data)
-      rescue Zlib::DataError => e
-        # by default, Ruby's Zlib assumes the data it's inflating
-        # is RFC1951 deflated data, wrapped in a RFC1951 zlib container.
-        # If that fails, then use an undocumented 'feature' to attempt to inflate
-        # the data as a raw RFC1951 stream.
-        #
-        # See
-        # - http://blade.nagaokaut.ac.jp/cgi-bin/scat.rb/ruby/ruby-talk/243545
-        # - http://www.gzip.org/zlib/zlib_faq.html#faq38
-        deflated = Zlib::Inflate.new(-Zlib::MAX_WBITS).inflate(data)
-      end
-      depredict(deflated, @options)
-    rescue Exception => e
-      # Oops, there was a problem inflating the stream
-      raise MalformedPDFError, "Error occured while inflating a compressed stream (#{e.class.to_s}: #{e.to_s})"
-    end
-    ################################################################################
-    # Decode the specified data with the LZW compression algorithm
-    def lzw(data)
-      data = PDF::Reader::LZW.decode(data)
-      depredict(data, @options)
-    end
-    ################################################################################
-    # Decode the specified data with the RunLengthDecode compression algorithm
-    def runlength(data)
-      pos = 0
-      out = ""
-      while pos < data.length
-        if data.respond_to?(:getbyte)
-          length = data.getbyte(pos)
-        else
-          length = data[pos]
-        end
-        pos += 1
-        case
-        when length == 128
-          break
-        when length < 128
-          # When the length is < 128, we copy the following length+1 bytes
-          # literally.
-          out << data[pos, length + 1]
-          pos += length
-        else
-          # When the length is > 128, we copy the next byte (257 - length)
-          # times; i.e., "\xFA\x00" ([250, 0]) will expand to
-          # "\x00\x00\x00\x00\x00\x00\x00".
-          out << data[pos, 1] * (257 - length)
-        end
-        pos += 1
-      end
-      out
-    end
-    ################################################################################
-    def depredict(data, opts = {})
-      predictor = (opts || {})[:Predictor].to_i
-      case predictor
-      when 0, 1 then
-        data
-      when 2    then
-        tiff_depredict(data, opts)
-      when 10, 11, 12, 13, 14, 15 then
-        png_depredict(data, opts)
-      else
-        raise  MalformedPDFError, "Unrecognised predictor value (#{predictor})"
-      end
-    end
-    ################################################################################
-    def tiff_depredict(data, opts = {})
-      data        = data.unpack("C*")
-      unfiltered  = []
-      bpc         = opts[:BitsPerComponent] || 8
-      pixel_bits  = bpc * opts[:Colors]
-      pixel_bytes = pixel_bits / 8
-      line_len    = (pixel_bytes * opts[:Columns])
-      pos         = 0
-      if bpc != 8
-        raise UnsupportedFeatureError, "TIFF predictor onlys supports 8 Bits Per Component"
-      end
-      until pos > data.size
-        row_data = data[pos, line_len]
-        row_data.each_with_index do |byte, index|
-          left = index < pixel_bytes ? 0 : row_data[index - pixel_bytes]
-          row_data[index] = (byte + left) % 256
-        end
-        unfiltered += row_data
-        pos += line_len
-      end
-      unfiltered.pack("C*")
-    end
-    ################################################################################
-    def png_depredict(data, opts = {})
-      return data if opts.nil? || opts[:Predictor].to_i < 10
-      data = data.unpack("C*")
-      pixel_bytes     = opts[:Colors] || 1
-      scanline_length = (pixel_bytes * opts[:Columns]) + 1
-      row = 0
-      pixels = []
-      paeth, pa, pb, pc = nil
-      until data.empty? do
-        row_data = data.slice! 0, scanline_length
-        filter = row_data.shift
-        case filter
-        when 0 # None
-        when 1 # Sub
-          row_data.each_with_index do |byte, index|
-            left = index < pixel_bytes ? 0 : row_data[index - pixel_bytes]
-            row_data[index] = (byte + left) % 256
-            #p [byte, left, row_data[index]]
-          end
-        when 2 # Up
-          row_data.each_with_index do |byte, index|
-            col = index / pixel_bytes
-            upper = row == 0 ? 0 : pixels[row-1][col][index % pixel_bytes]
-            row_data[index] = (upper + byte) % 256
-          end
-        when 3  # Average
-          row_data.each_with_index do |byte, index|
-            col = index / pixel_bytes
-            upper = row == 0 ? 0 : pixels[row-1][col][index % pixel_bytes]
-            left = index < pixel_bytes ? 0 : row_data[index - pixel_bytes]
-            row_data[index] = (byte + ((left + upper)/2).floor) % 256
-          end
-        when 4 # Paeth
-          left = upper = upper_left = nil
-          row_data.each_with_index do |byte, index|
-            col = index / pixel_bytes
-            left = index < pixel_bytes ? 0 : row_data[index - pixel_bytes]
-            if row.zero?
-              upper = upper_left = 0
-            else
-              upper = pixels[row-1][col][index % pixel_bytes]
-              upper_left = col.zero? ? 0 :
-                pixels[row-1][col-1][index % pixel_bytes]
-            end
-            p = left + upper - upper_left
-            pa = (p - left).abs
-            pb = (p - upper).abs
-            pc = (p - upper_left).abs
-            paeth = if pa <= pb && pa <= pc
-                      left
-                    elsif pb <= pc
-                      upper
-                    else
-                      upper_left
-                    end
-            row_data[index] = (byte + paeth) % 256
-          end
-        else
-          raise ArgumentError, "Invalid filter algorithm #{filter}"
-        end
-        s = []
-        row_data.each_slice pixel_bytes do |slice|
-          s << slice
-        end
-        pixels << s
-        row += 1
-      end
-      pixels.map { |bytes| bytes.flatten.pack("C*") }.join("")
-    end
   end
 end
-################################################################################