RubyGems - origami - Versions diffs - 1.2.7 → 2.0.0 - Mend

origami 1.2.7 → 2.0.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (162) hide show

checksums.yaml +4 -4
data/CHANGELOG.md +66 -0
data/README.md +112 -0
data/bin/config/pdfcop.conf.yml +232 -233
data/bin/gui/about.rb +27 -37
data/bin/gui/config.rb +108 -117
data/bin/gui/file.rb +416 -365
data/bin/gui/gtkhex.rb +1138 -1153
data/bin/gui/hexview.rb +55 -57
data/bin/gui/imgview.rb +48 -51
data/bin/gui/menu.rb +388 -386
data/bin/gui/properties.rb +114 -130
data/bin/gui/signing.rb +571 -617
data/bin/gui/textview.rb +77 -95
data/bin/gui/treeview.rb +382 -387
data/bin/gui/walker.rb +227 -232
data/bin/gui/xrefs.rb +56 -60
data/bin/pdf2pdfa +53 -57
data/bin/pdf2ruby +212 -228
data/bin/pdfcop +338 -348
data/bin/pdfdecompress +58 -65
data/bin/pdfdecrypt +56 -60
data/bin/pdfencrypt +75 -80
data/bin/pdfexplode +185 -182
data/bin/pdfextract +201 -218
data/bin/pdfmetadata +83 -82
data/bin/pdfsh +4 -5
data/bin/pdfwalker +1 -2
data/bin/shell/.irbrc +45 -82
data/bin/shell/console.rb +105 -130
data/bin/shell/hexdump.rb +40 -64
data/examples/README.md +34 -0
data/examples/attachments/attachment.rb +38 -0
data/examples/attachments/nested_document.rb +51 -0
data/examples/encryption/encryption.rb +28 -0
data/{samples/actions/triggerevents/trigger.rb → examples/events/events.rb} +13 -16
data/examples/flash/flash.rb +37 -0
data/{samples → examples}/flash/helloworld.swf +0 -0
data/examples/forms/javascript.rb +54 -0
data/examples/forms/xfa.rb +115 -0
data/examples/javascript/hello_world.rb +22 -0
data/examples/javascript/js_emulation.rb +54 -0
data/examples/loop/goto.rb +32 -0
data/examples/loop/named.rb +33 -0
data/examples/signature/signature.rb +65 -0
data/examples/uri/javascript.rb +56 -0
data/examples/uri/open-uri.rb +21 -0
data/examples/uri/submitform.rb +47 -0
data/lib/origami.rb +29 -42
data/lib/origami/3d.rb +350 -225
data/lib/origami/acroform.rb +262 -288
data/lib/origami/actions.rb +268 -288
data/lib/origami/annotations.rb +697 -722
data/lib/origami/array.rb +258 -184
data/lib/origami/boolean.rb +74 -84
data/lib/origami/catalog.rb +397 -434
data/lib/origami/collections.rb +144 -0
data/lib/origami/destinations.rb +233 -194
data/lib/origami/dictionary.rb +253 -232
data/lib/origami/encryption.rb +1274 -1243
data/lib/origami/export.rb +232 -268
data/lib/origami/extensions/fdf.rb +307 -220
data/lib/origami/extensions/ppklite.rb +368 -435
data/lib/origami/filespec.rb +197 -0
data/lib/origami/filters.rb +301 -295
data/lib/origami/filters/ascii.rb +177 -180
data/lib/origami/filters/ccitt.rb +528 -535
data/lib/origami/filters/crypt.rb +26 -35
data/lib/origami/filters/dct.rb +46 -52
data/lib/origami/filters/flate.rb +95 -94
data/lib/origami/filters/jbig2.rb +49 -55
data/lib/origami/filters/jpx.rb +38 -44
data/lib/origami/filters/lzw.rb +189 -183
data/lib/origami/filters/predictors.rb +221 -235
data/lib/origami/filters/runlength.rb +103 -104
data/lib/origami/font.rb +173 -186
data/lib/origami/functions.rb +67 -81
data/lib/origami/graphics.rb +25 -21
data/lib/origami/graphics/colors.rb +178 -187
data/lib/origami/graphics/instruction.rb +79 -85
data/lib/origami/graphics/path.rb +142 -148
data/lib/origami/graphics/patterns.rb +160 -167
data/lib/origami/graphics/render.rb +43 -50
data/lib/origami/graphics/state.rb +138 -153
data/lib/origami/graphics/text.rb +188 -205
data/lib/origami/graphics/xobject.rb +819 -815
data/lib/origami/header.rb +63 -78
data/lib/origami/javascript.rb +596 -597
data/lib/origami/linearization.rb +285 -290
data/lib/origami/metadata.rb +139 -148
data/lib/origami/name.rb +112 -148
data/lib/origami/null.rb +53 -62
data/lib/origami/numeric.rb +162 -175
data/lib/origami/obfuscation.rb +186 -174
data/lib/origami/object.rb +593 -573
data/lib/origami/outline.rb +42 -47
data/lib/origami/outputintents.rb +73 -82
data/lib/origami/page.rb +703 -592
data/lib/origami/parser.rb +238 -290
data/lib/origami/parsers/fdf.rb +41 -33
data/lib/origami/parsers/pdf.rb +75 -95
data/lib/origami/parsers/pdf/lazy.rb +137 -0
data/lib/origami/parsers/pdf/linear.rb +64 -66
data/lib/origami/parsers/ppklite.rb +34 -70
data/lib/origami/pdf.rb +1030 -1005
data/lib/origami/reference.rb +102 -102
data/lib/origami/signature.rb +591 -609
data/lib/origami/stream.rb +668 -551
data/lib/origami/string.rb +397 -373
data/lib/origami/template/patterns.rb +56 -0
data/lib/origami/template/widgets.rb +151 -0
data/lib/origami/trailer.rb +144 -158
data/lib/origami/tree.rb +62 -0
data/lib/origami/version.rb +23 -0
data/lib/origami/webcapture.rb +88 -79
data/lib/origami/xfa.rb +2863 -2882
data/lib/origami/xreftable.rb +472 -384
data/test/dataset/calc.pdf +85 -0
data/test/dataset/crypto.pdf +82 -0
data/test/dataset/empty.pdf +49 -0
data/test/test_actions.rb +27 -0
data/test/test_annotations.rb +90 -0
data/test/test_pages.rb +31 -0
data/test/test_pdf.rb +16 -0
data/test/test_pdf_attachment.rb +34 -0
data/test/test_pdf_create.rb +24 -0
data/test/test_pdf_encrypt.rb +95 -0
data/test/test_pdf_parse.rb +96 -0
data/test/test_pdf_sign.rb +58 -0
data/test/test_streams.rb +182 -0
data/test/test_xrefs.rb +67 -0
metadata +88 -58
data/README +0 -67
data/bin/pdf2graph +0 -121
data/bin/pdfcocoon +0 -104
data/lib/origami/file.rb +0 -233
data/samples/README.txt +0 -45
data/samples/actions/launch/calc.rb +0 -87
data/samples/actions/launch/winparams.rb +0 -22
data/samples/actions/loop/loopgoto.rb +0 -24
data/samples/actions/loop/loopnamed.rb +0 -21
data/samples/actions/named/named.rb +0 -31
data/samples/actions/samba/smbrelay.rb +0 -26
data/samples/actions/webbug/submitform.js +0 -26
data/samples/actions/webbug/webbug-browser.rb +0 -68
data/samples/actions/webbug/webbug-js.rb +0 -67
data/samples/actions/webbug/webbug-reader.rb +0 -90
data/samples/attachments/attach.rb +0 -40
data/samples/attachments/attached.txt +0 -1
data/samples/crypto/crypto.rb +0 -28
data/samples/digsig/signed.rb +0 -46
data/samples/exploits/cve-2008-2992-utilprintf.rb +0 -87
data/samples/exploits/cve-2009-0927-geticon.rb +0 -65
data/samples/exploits/exploit_customdictopen.rb +0 -55
data/samples/exploits/getannots.rb +0 -69
data/samples/flash/flash.rb +0 -31
data/samples/javascript/attached.txt +0 -1
data/samples/javascript/js.rb +0 -52
data/templates/patterns.rb +0 -66
data/templates/widgets.rb +0 -173
data/templates/xdp.rb +0 -92
data/test/ts_pdf.rb +0 -50

data/bin/pdfexplode CHANGED

@@ -1,34 +1,33 @@
-#!/usr/bin/env ruby
+#!/usr/bin/env ruby
 =begin
-= Author:
-  Guillaume Delugré <guillaume/at/security-labs.org>
+= Info
+    Explodes a PDF into separate documents.
-= Info:
-  Explodes a PDF into separate documents.
-= License:
-	Origami is free software: you can redistribute it and/or modify
-  it under the terms of the GNU Lesser General Public License as published by
-  the Free Software Foundation, either version 3 of the License, or
-  (at your option) any later version.
+= License
+    Copyright (C) 2016  Guillaume Delugré.
-  Origami is distributed in the hope that it will be useful,
-  but WITHOUT ANY WARRANTY; without even the implied warranty of
-  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
-  GNU Lesser General Public License for more details.
+    Origami is free software: you can redistribute it and/or modify
+    it under the terms of the GNU Lesser General Public License as published by
+    the Free Software Foundation, either version 3 of the License, or
+    (at your option) any later version.
-  You should have received a copy of the GNU Lesser General Public License
-  along with Origami.  If not, see <http://www.gnu.org/licenses/>.
+    Origami is distributed in the hope that it will be useful,
+    but WITHOUT ANY WARRANTY; without even the implied warranty of
+    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+    GNU Lesser General Public License for more details.
+    You should have received a copy of the GNU Lesser General Public License
+    along with Origami.  If not, see <http://www.gnu.org/licenses/>.
 =end
 begin
-  require 'origami'
+    require 'origami'
 rescue LoadError
-  ORIGAMIDIR = "#{File.dirname(__FILE__)}/../lib"
-  $: << ORIGAMIDIR
-  require 'origami'
+    $: << File.join(__dir__, '../lib')
+    require 'origami'
 end
 include Origami
@@ -36,185 +35,189 @@ require 'optparse'
 require 'rexml/document'
 class OptParser
-  BANNER = <<USAGE
+    BANNER = <<USAGE
 Usage: #{$0} <PDF-file> [-r <range>] [-t pages|rsrc] [-d <output-directory>]
 Explodes a document into separate documents.
-Bug reports or feature requests at: http://origami-pdf.googlecode.com/
+Bug reports or feature requests at: http://github.com/gdelugre/origami
 Options:
 USAGE
-  def self.parser(options)
-    OptionParser.new do |opts|
-      opts.banner = BANNER
-      opts.on("-d", "--output-dir DIR", "Output directory.") do |d|
-        options[:output_dir] = d
-      end
-      opts.on("-r", "--range PAGES", "Page range (e.g: 2-, 1-3, 5). Default to '-'.") do |r|
-        range =
-          if r.index('-').nil?
-            page = r.to_i
-            Range.new(page-1, page-1)
-          else
-            from, to = r.split('-').map{|bound| bound.to_i}
-            from ||= 1
-            to ||= 0
-            Range.new(from-1, to-1)
-          end
-        options[:page_range] = range
-      end
-      opts.on("-t", "--type TYPE", "Split by type. Can be 'pages' or 'rsrc'. Default to 'pages'.") do |t|
-        options[:split_by] = t
-      end
-      opts.on_tail("-h", "--help", "Show this message.") do
-        puts opts
-        exit
-      end
+    def self.parser(options)
+        OptionParser.new do |opts|
+            opts.banner = BANNER
+            opts.on("-d", "--output-dir DIR", "Output directory.") do |d|
+                options[:output_dir] = d
+            end
+            opts.on("-r", "--range PAGES", "Page range (e.g: 2-, 1-3, 5). Default to '-'.") do |r|
+                range =
+                    if r.index('-').nil?
+                        page = r.to_i
+                        Range.new(page-1, page-1)
+                    else
+                        from, to = r.split('-').map{|bound| bound.to_i}
+                        from ||= 1
+                        to ||= 0
+                        Range.new(from-1, to-1)
+                    end
+                options[:page_range] = range
+            end
+            opts.on("-t", "--type TYPE", "Split by type. Can be 'pages' or 'rsrc'. Default to 'pages'.") do |t|
+                options[:split_by] = t
+            end
+            opts.on_tail("-h", "--help", "Show this message.") do
+                puts opts
+                exit
+            end
+        end
     end
-  end
-  def self.parse(args)
-    options =
-    {
-      :page_range => (0..-1),
-      :split_by => 'pages'
-    }
+    def self.parse(args)
+        options =
+        {
+            page_range: (0..-1),
+            split_by: 'pages'
+        }
-    self.parser(options).parse!(args)
+        self.parser(options).parse!(args)
-    options
-  end
+        options
+    end
 end
 begin
-  @options = OptParser.parse(ARGV)
-  if ARGV.empty?
-    STDERR.puts "Error: No filename was specified. #{$0} --help for details."
-    exit 1
-  else
-    target = ARGV.shift
-  end
-  if @options[:output_dir].nil?
-    @options[:output_dir] = "#{File.join(File.dirname(target), File.basename(target,'.pdf'))}.explode"
-  end
-  Origami::OPTIONS[:ignore_bad_references] = true
-  OUTPUT_DIR = @options[:output_dir]
-  Dir::mkdir(OUTPUT_DIR) unless File.directory?(OUTPUT_DIR)
-  def split_by_rsrc(n, page, type)
-    all_rsrc = page.resources
-    type_rsrc = page.ls_resources(type)
-    other_rsrc = all_rsrc.keys - type_rsrc.keys
-    unless type_rsrc.empty?
-      # Keep only specified resource type.
-      output_file = File.join(OUTPUT_DIR, "page_#{n}_keeponly_#{type}.pdf")
-      PDF.write(output_file) do |pdf|
-        reduced = page.copy
-        # New resource dictionary with only matching resources.
-        reduced.Resources = Resources.new(type => type_rsrc)
-        # Remove mention of other resources.
-        reduced.Contents.data = reduced.Contents.data.lines.to_a.
-          delete_if {|line| other_rsrc.any?{|rsrc| line =~ /#{rsrc}/}}.join
-        STDERR.puts "Creating #{output_file}..."
-        pdf.append_page(reduced)
-      end
-      # Remove all specified resource type.
-      output_file = File.join(OUTPUT_DIR, "page_#{n}_excluded_#{type}.pdf")
-      PDF.write(output_file) do |pdf|
-        reduced = page.copy
-        # New resource dictionary with no resource of specified type.
-        reduced.Resources = reduced.Resources.copy
-        reduced.Resources.delete(type)
-        # Remove mention this resource type.
-        reduced.Contents.data = reduced.Contents.data.lines.to_a.
-          delete_if {|line| type_rsrc.keys.any?{|rsrc| line =~ /#{rsrc}/}}.join
-        STDERR.puts "Creating #{output_file}..."
-        pdf.append_page(reduced)
-      end
-      # Now treating each resource object separately.
-      type_rsrc.each_pair do |name, rsrc|
-        anyother_rsrc = all_rsrc.keys - [ name ]
-        # Keey only specified resource object.
-        output_file = File.join(OUTPUT_DIR, "page_#{n}_keeponly_#{type}_#{name}.pdf")
-        PDF.write(output_file) do |pdf|
-          reduced = page.copy
-          # New resource dictionary with only specified resource object.
-          reduced.Resources = Resources.new(type => {name => rsrc})
-          # Remove mention of all other resources.
-          reduced.Contents.data = reduced.Contents.data.lines.to_a.
-            delete_if {|line| anyother_rsrc.any?{|rsrc| line =~ /#{rsrc}/}}.join
-          STDERR.puts "Creating #{output_file}..."
-          pdf.append_page(reduced)
-        end
-        # Remove only specified resource object.
-        output_file = File.join(OUTPUT_DIR, "page_#{n}_excluded_#{type}_#{name}.pdf")
-        PDF.write(output_file) do |pdf|
-          reduced = page.copy
-          # New resource dictionary with only specified resource object.
-          reduced.Resources = reduced.Resources.copy
-          reduced.Resources[type] = reduced.Resources.send(type).copy
-          reduced.Resources[type].delete(name)
-          # Remove mention of this resource only.
-          reduced.Contents.data = reduced.Contents.data.lines.to_a.
-            delete_if {|line| line =~ /#{name}/}.join
-          STDERR.puts "Creating #{output_file}..."
-          pdf.append_page(reduced)
+    @options = OptParser.parse(ARGV)
+    if ARGV.empty?
+        abort "Error: No filename was specified. #{$0} --help for details."
+    else
+        target = ARGV.shift
+    end
+    if @options[:output_dir].nil?
+        @options[:output_dir] = "#{File.join(File.dirname(target), File.basename(target,'.pdf'))}.explode"
+    end
+    Origami::OPTIONS[:ignore_bad_references] = true
+    OUTPUT_DIR = @options[:output_dir]
+    Dir::mkdir(OUTPUT_DIR) unless File.directory?(OUTPUT_DIR)
+    def split_by_rsrc(n, page, type)
+        all_rsrc = page.resources
+        type_rsrc = page.resources(type)
+        other_rsrc = all_rsrc.keys - type_rsrc.keys
+        unless type_rsrc.empty?
+            # Keep only specified resource type.
+            output_file = File.join(OUTPUT_DIR, "page_#{n}_keeponly_#{type}.pdf")
+            PDF.write(output_file) do |pdf|
+                reduced = page.copy
+                # New resource dictionary with only matching resources.
+                reduced.Resources = Resources.new(type => type_rsrc)
+                # Remove mention of other resources.
+                reduced.each_content_stream do |stream|
+                    stream.data = stream.data.lines.
+                        delete_if {|line| other_rsrc.any?{|rsrc| line =~ /#{rsrc}/}}.join
+                end
+                STDERR.puts "Creating #{output_file}..."
+                pdf.append_page(reduced)
+            end
+            # Remove all specified resource type.
+            output_file = File.join(OUTPUT_DIR, "page_#{n}_excluded_#{type}.pdf")
+            PDF.write(output_file) do |pdf|
+                reduced = page.copy
+                # New resource dictionary with no resource of specified type.
+                reduced.Resources = reduced.Resources.copy
+                reduced.Resources.delete(type)
+                # Remove mention this resource type.
+                reduced.each_content_stream do |stream|
+                    stream.data = stream.data.lines.
+                        delete_if {|line| type_rsrc.keys.any?{|rsrc| line =~ /#{rsrc}/}}.join
+                end
+                STDERR.puts "Creating #{output_file}..."
+                pdf.append_page(reduced)
+            end
+            # Now treating each resource object separately.
+            type_rsrc.each_pair do |name, rsrc|
+                anyother_rsrc = all_rsrc.keys - [ name ]
+                # Keey only specified resource object.
+                output_file = File.join(OUTPUT_DIR, "page_#{n}_keeponly_#{type}_#{name}.pdf")
+                PDF.write(output_file) do |pdf|
+                    reduced = page.copy
+                    # New resource dictionary with only specified resource object.
+                    reduced.Resources = Resources.new(type => {name => rsrc})
+                    # Remove mention of all other resources.
+                    reduced.each_content_stream do |stream|
+                        stream.data = stream.data.lines.
+                            delete_if {|line| anyother_rsrc.any?{|rsrc| line =~ /#{rsrc}/}}.join
+                    end
+                    STDERR.puts "Creating #{output_file}..."
+                    pdf.append_page(reduced)
+                end
+                # Remove only specified resource object.
+                output_file = File.join(OUTPUT_DIR, "page_#{n}_excluded_#{type}_#{name}.pdf")
+                PDF.write(output_file) do |pdf|
+                    reduced = page.copy
+                    # New resource dictionary with only specified resource object.
+                    reduced.Resources = reduced.Resources.copy
+                    reduced.Resources[type] = reduced.Resources.send(type).copy
+                    reduced.Resources[type].delete(name)
+                    # Remove mention of this resource only.
+                    reduced.each_content_stream do |stream|
+                        stream.data = stream.data.lines.
+                            delete_if {|line| line =~ /#{name}/}.join
+                    end
+                    STDERR.puts "Creating #{output_file}..."
+                    pdf.append_page(reduced)
+                end
+            end
         end
-      end
     end
-  end
-  params =
-  {
-    :verbosity => Parser::VERBOSE_QUIET,
-  }
-  pdf = PDF.read(target, params)
-  i = @options[:page_range].first + 1
-  pdf.pages[@options[:page_range]].each do |page|
-    case @options[:split_by]
-      when 'pages'
-        output_file = File.join(OUTPUT_DIR, "page_#{i}.pdf")
-        PDF.write(output_file) do |pdf|
-          STDERR.puts "Creating #{output_file}..."
-          pdf.append_page(page)
+    params =
+    {
+        verbosity: Parser::VERBOSE_QUIET,
+    }
+    pdf = PDF.read(target, params)
+    i = @options[:page_range].first + 1
+    pdf.pages[@options[:page_range]].each do |page|
+        case @options[:split_by]
+        when 'pages'
+            output_file = File.join(OUTPUT_DIR, "page_#{i}.pdf")
+            PDF.write(output_file) do |pdf|
+              STDERR.puts "Creating #{output_file}..."
+              pdf.append_page(page)
+            end
+        when 'rsrc'
+            [ Resources::EXTGSTATE,
+              Resources::COLORSPACE,
+              Resources::PATTERN,
+              Resources::SHADING,
+              Resources::XOBJECT,
+              Resources::FONT,
+              Resources::PROPERTIES
+            ].each { |type| split_by_rsrc(i, page, type) }
+        else
+            raise ArgumentError, "Unknown split option: #{@options[:split_by]}"
         end
-      when 'rsrc'
-        [ Resources::EXTGSTATE,
-          Resources::COLORSPACE,
-          Resources::PATTERN,
-          Resources::SHADING,
-          Resources::XOBJECT,
-          Resources::FONT,
-          Resources::PROPERTIES
-        ].each { |type| split_by_rsrc(i, page, type) }
-      else
-        raise ArgumentError, "Unknown split option: #{@options[:split_by]}"
+        i += 1
     end
-    i += 1
-  end
-rescue SystemExit
-rescue Exception => e
-  STDERR.puts "#{e.class}: #{e.message} #{e.backtrace}"
-  exit 1
+rescue
+    abort "#{$!.class}: #{$!.message} #{$!.backtrace.join($/)}"
 end

data/bin/pdfextract CHANGED

@@ -1,38 +1,36 @@
-#!/usr/bin/env ruby
+#!/usr/bin/env ruby
 =begin
-= Author:
-  Guillaume Delugré <guillaume/at/security-labs.org>
+= Info
+    Extracts valuable data from a PDF document. Can extract:
+     - decoded streams
+     - JavaScript
+     - file attachments
-= Info:
-  Extracts valuable data from a PDF document. Can extract:
-    - decoded streams
-    - JavaScript
-    - file attachments
+= License
+    Copyright (C) 2016  Guillaume Delugré.
-= License:
-	Origami is free software: you can redistribute it and/or modify
-  it under the terms of the GNU Lesser General Public License as published by
-  the Free Software Foundation, either version 3 of the License, or
-  (at your option) any later version.
+    Origami is free software: you can redistribute it and/or modify
+    it under the terms of the GNU Lesser General Public License as published by
+    the Free Software Foundation, either version 3 of the License, or
+    (at your option) any later version.
-  Origami is distributed in the hope that it will be useful,
-  but WITHOUT ANY WARRANTY; without even the implied warranty of
-  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
-  GNU Lesser General Public License for more details.
+    Origami is distributed in the hope that it will be useful,
+    but WITHOUT ANY WARRANTY; without even the implied warranty of
+    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+    GNU Lesser General Public License for more details.
-  You should have received a copy of the GNU Lesser General Public License
-  along with Origami.  If not, see <http://www.gnu.org/licenses/>.
+    You should have received a copy of the GNU Lesser General Public License
+    along with Origami.  If not, see <http://www.gnu.org/licenses/>.
 =end
 begin
-  require 'origami'
+    require 'origami'
 rescue LoadError
-  ORIGAMIDIR = "#{File.dirname(__FILE__)}/../lib"
-  $: << ORIGAMIDIR
-  require 'origami'
+    $: << File.join(__dir__, '../lib')
+    require 'origami'
 end
 include Origami
@@ -40,246 +38,231 @@ require 'optparse'
 require 'rexml/document'
 class OptParser
-  BANNER = <<USAGE
+    BANNER = <<USAGE
 Usage: #{$0} <PDF-file> [-afjms] [-d <output-directory>]
 Extracts various data out of a document (streams, scripts, images, fonts, metadata, attachments).
-Bug reports or feature requests at: http://origami-pdf.googlecode.com/
+Bug reports or feature requests at: http://github.com/gdelugre/origami
 Options:
 USAGE
-  def self.parser(options)
-    OptionParser.new do |opts|
-      opts.banner = BANNER
+    def self.parser(options)
+        OptionParser.new do |opts|
+            opts.banner = BANNER
-      opts.on("-d", "--output-dir DIR", "Output directory") do |d|
-        options[:output_dir] = d
-      end
+            opts.on("-d", "--output-dir DIR", "Output directory") do |d|
+                options[:output_dir] = d
+            end
-      opts.on("-s", "--streams", "Extracts all decoded streams") do
-        options[:streams] = true
-      end
+            opts.on("-s", "--streams", "Extracts all decoded streams") do
+                options[:streams] = true
+            end
-      opts.on("-a", "--attachments", "Extracts file attachments") do
-        options[:attachments] = true
-      end
+            opts.on("-a", "--attachments", "Extracts file attachments") do
+                options[:attachments] = true
+            end
-      opts.on("-f", "--fonts", "Extracts embedded font files") do
-        options[:fonts] = true
-      end
+            opts.on("-f", "--fonts", "Extracts embedded font files") do
+                options[:fonts] = true
+            end
-      opts.on("-j", "--js", "Extracts JavaScript scripts") do
-        options[:javascript] = true
-      end
+            opts.on("-j", "--js", "Extracts JavaScript scripts") do
+                options[:javascript] = true
+            end
-      opts.on("-m", "--metadata", "Extracts metadata streams") do
-        options[:metadata] = true
-      end
+            opts.on("-m", "--metadata", "Extracts metadata streams") do
+                options[:metadata] = true
+            end
-      opts.on("-i", "--images", "Extracts embedded images") do
-        options[:images] = true
-      end
+            opts.on("-i", "--images", "Extracts embedded images") do
+                options[:images] = true
+            end
-      opts.on_tail("-h", "--help", "Show this message") do
-        puts opts
-        exit
-      end
+            opts.on_tail("-h", "--help", "Show this message") do
+                puts opts
+                exit
+            end
+        end
     end
-  end
-  def self.parse(args)
-    options =
-    {
-    }
+    def self.parse(args)
+        options = {}
-    self.parser(options).parse!(args)
+        self.parser(options).parse!(args)
-    options
-  end
+        options
+    end
 end
 begin
-  @options = OptParser.parse(ARGV)
-  if ARGV.empty?
-    STDERR.puts "Error: No filename was specified. #{$0} --help for details."
-    exit 1
-  else
-    target = ARGV.shift
-  end
-  unless [:streams,:javascript,:attachments,:fonts,:metadata,:images].any? {|opt| @options[opt]}
-    @options[:streams] =
-    @options[:javascript] =
-    @options[:fonts] =
-    @options[:attachments] =
-    @options[:images] = true
-  end
-  if @options[:output_dir].nil?
-    @options[:output_dir] = "#{File.basename(target, '.pdf')}.dump"
-  end
-  # Force data extraction, even for invalid FlateDecode streams.
-  Origami::OPTIONS[:ignore_zlib_errors] = true
-  OUTPUT_DIR = @options[:output_dir]
-  Dir::mkdir(OUTPUT_DIR) unless File.directory?(OUTPUT_DIR)
-  params =
-  {
-    :verbosity => Parser::VERBOSE_QUIET,
-  }
-  pdf = PDF.read(target, params)
-  if @options[:streams]
-    nstreams = 0
-    Dir::mkdir("#{OUTPUT_DIR}/streams") unless File.directory?("#{OUTPUT_DIR}/streams")
-    pdf.root_objects.find_all{|obj| obj.is_a?(Stream)}.each do |stream|
-      stream_file = "#{OUTPUT_DIR}/streams/stream_#{stream.reference.refno}.dmp"
-      File.open(stream_file, "wb") do |fd|
-        fd.write(stream.data)
-      end
-      nstreams += 1
+    @options = OptParser.parse(ARGV)
+    if ARGV.empty?
+        abort "Error: No filename was specified. #{$0} --help for details."
+    else
+        target = ARGV.shift
     end
-    puts "Extracted #{nstreams} PDF streams to '#{OUTPUT_DIR}/streams'."
-  end
+    unless %i[streams javascript attachments fonts metadata images].any? {|opt| @options[opt]}
+        @options[:streams] =
+        @options[:javascript] =
+        @options[:fonts] =
+        @options[:attachments] =
+        @options[:images] = true
+    end
-  if @options[:javascript]
-    nscripts = 0
-    Dir::mkdir("#{OUTPUT_DIR}/scripts") unless File.directory?("#{OUTPUT_DIR}/scripts")
+    if @options[:output_dir].nil?
+        @options[:output_dir] = "#{File.basename(target, '.pdf')}.dump"
+    end
-    pdf.ls(/^JS$/).each do |script|
-      script_file = "#{OUTPUT_DIR}/scripts/script_#{script.hash}.js"
-      File.open(script_file, "wb") do |fd|
-        fd.write(
-          case script
-            when Stream then
-              script.data
-            else
-              script.value
-          end
-        )
-      end
-      nscripts += 1
+    # Force data extraction, even for invalid FlateDecode streams.
+    Origami::OPTIONS[:ignore_zlib_errors] = true
+    Origami::OPTIONS[:ignore_png_errors] = true
+    OUTPUT_DIR = @options[:output_dir]
+    Dir::mkdir(OUTPUT_DIR) unless File.directory?(OUTPUT_DIR)
+    params =
+    {
+        verbosity: Parser::VERBOSE_QUIET,
+    }
+    pdf = PDF.read(target, params)
+    if @options[:streams]
+        nstreams = 0
+        stream_dir = File.join(OUTPUT_DIR, "streams")
+        Dir::mkdir(stream_dir) unless File.directory?(stream_dir)
+        pdf.root_objects.find_all{|obj| obj.is_a?(Stream)}.each do |stream|
+            stream_file = File.join(stream_dir, "stream_#{stream.reference.refno}.dmp")
+            File.binwrite(stream_file, stream.data)
+            nstreams += 1
+        end
+        puts "Extracted #{nstreams} PDF streams to '#{stream_dir}'."
     end
-    # Also checking for presence of JavaScript in XML forms.
-    if pdf.has_form? and pdf.Catalog.AcroForm.has_key?(:XFA)
-      xfa = pdf.Catalog.AcroForm[:XFA].solve
-      case xfa
-        when Array then
-          xml = ""
-          i = 0
-          xfa.each do |packet|
-            if i % 2 == 1
-              xml << packet.solve.data
+    if @options[:javascript]
+        nscripts = 0
+        js_dir = File.join(OUTPUT_DIR, "scripts")
+        Dir::mkdir(js_dir) unless File.directory?(js_dir)
+        pdf.ls(/^JS$/).each do |script|
+            script_file = File.join(js_dir, "script_#{script.hash}.js")
+            script_data =
+                case script
+                when Stream then script.data
+                else script.value
+                end
+            File.binwrite(script_file, script_data)
+            nscripts += 1
+        end
+        # Also checking for presence of JavaScript in XML forms.
+        if pdf.form? and pdf.Catalog.AcroForm.has_key?(:XFA)
+            xfa = pdf.Catalog.AcroForm[:XFA].solve
+            case xfa
+            when Array then
+                xml = ""
+                i = 0
+                xfa.each do |packet|
+                    if i % 2 == 1
+                        xml << packet.solve.data
+                    end
+                    i = i + 1
+                end
+            when Stream then
+                xml = xfa.data
+            else
+                reject("Malformed XFA dictionary")
             end
-            i = i + 1
-          end
-        when Stream then
-          xml = xfa.data
-        else
-          reject("Malformed XFA dictionary")
-      end
-      xfadoc = REXML::Document.new(xml)
-      REXML::XPath.match(xfadoc, "//script").each do |script|
-        script_file = "#{OUTPUT_DIR}/script_#{script.hash}.js"
-        File.open(script_file, "wb") do |fd|
-          fd.write(script.text)
+            xfadoc = REXML::Document.new(xml)
+            REXML::XPath.match(xfadoc, "//script").each do |script|
+                script_file = File.join(js_dir, "script_#{script.hash}.js")
+                File.binwrite(script_file, script.text)
+                nscripts += 1
+            end
         end
-        nscripts += 1
-      end
+        puts "Extracted #{nscripts} scripts to '#{js_dir}'."
     end
-    puts "Extracted #{nscripts} scripts to '#{OUTPUT_DIR}/scripts'."
-  end
-  if @options[:attachments]
-    nattach = 0
-    Dir::mkdir("#{OUTPUT_DIR}/attachments") unless File.directory?("#{OUTPUT_DIR}/attachments")
-    pdf.ls_names(Names::Root::EMBEDDEDFILES).each do |name, attachment|
-      attached_file = "#{OUTPUT_DIR}/attachments/attached_#{File.basename(name)}"
-      spec = attachment.solve
-      if spec and spec.EF and f = spec.EF.F and f.is_a?(Stream)
-        File.open(attached_file, "wb") do |fd|
-          fd.write(f.data)
+    if @options[:attachments]
+        nattach = 0
+        attachments_dir = File.join(OUTPUT_DIR, "attachments")
+        Dir::mkdir(attachments_dir) unless File.directory?(attachments_dir)
+        pdf.each_attachment do |name, attachment|
+            attached_file = File.join(attachments_dir, "attached_#{File.basename(name)}")
+            spec = attachment.solve
+            if spec and spec.EF and f = spec.EF.F and f.is_a?(Stream)
+                File.binwrite(attached_file, f.data)
+                nattach += 1
+            end
         end
-        nattach += 1
-      end
+        puts "Extracted #{nattach} attachments to '#{attachments_dir}'."
     end
-    puts "Extracted #{nattach} attachments to '#{OUTPUT_DIR}/attachments'."
-  end
-  if @options[:fonts]
-    nfonts = 0
-    Dir::mkdir("#{OUTPUT_DIR}/fonts") unless File.directory?("#{OUTPUT_DIR}/fonts")
-    pdf.root_objects.find_all{|obj| obj.is_a?(Stream)}.each do |stream|
-      font = stream.xrefs.find{|obj| obj.is_a?(FontDescriptor)}
-      if font
-        font_file = "#{OUTPUT_DIR}/fonts/font_#{File.basename(font.FontName.value.to_s)}"
-        File.open(font_file, "wb") do |fd|
-          fd.write(stream.data)
+    if @options[:fonts]
+        nfonts = 0
+        fonts_dir = File.join(OUTPUT_DIR, "fonts")
+        Dir::mkdir(fonts_dir) unless File.directory?(fonts_dir)
+        pdf.root_objects.find_all{|obj| obj.is_a?(Stream)}.each do |stream|
+            font = stream.xrefs.find{|obj| obj.is_a?(FontDescriptor)}
+            if font
+                font_file = File.join(fonts_dir, File.basename(font.FontName.value.to_s))
+                File.binwrite(font_file, stream.data)
+                nfonts += 1
+            end
         end
-        nfonts += 1
-      end
+        puts "Extracted #{nfonts} fonts to '#{fonts_dir}'."
     end
-    puts "Extracted #{nfonts} fonts to '#{OUTPUT_DIR}/fonts'."
-  end
+    if @options[:metadata]
+        nmeta = 0
+        metadata_dir = File.join(OUTPUT_DIR, "metadata")
+        Dir::mkdir(metadata_dir) unless File.directory?(metadata_dir)
-  if @options[:metadata]
-    nmeta = 0
-    Dir::mkdir("#{OUTPUT_DIR}/metadata") unless File.directory?("#{OUTPUT_DIR}/metadata")
+        pdf.root_objects.find_all{|obj| obj.is_a?(MetadataStream)}.each do |stream|
+            metadata_file = File.join(metadata_dir, "metadata_#{stream.reference.refno}.xml")
+            File.binwrite(metadata_file, stream.data)
+            nmeta += 1
+        end
-    pdf.root_objects.find_all{|obj| obj.is_a?(MetadataStream)}.each do |stream|
-      metadata_file = "#{OUTPUT_DIR}/metadata/metadata_#{stream.reference.refno}.xml"
-      File.open(metadata_file, "wb") do |fd|
-        fd.write(stream.data)
-      end
-      nmeta += 1
+        puts "Extracted #{nmeta} metadata streams to '#{metadata_dir}'."
     end
-    puts "Extracted #{nmeta} metadata streams to '#{OUTPUT_DIR}/metadata'."
-  end
+    if @options[:images]
+        nimages = 0
+        image_dir = File.join(OUTPUT_DIR, "images")
+        Dir::mkdir(image_dir) unless File.directory?(image_dir)
-  if @options[:images]
-    nimages = 0
-    Dir::mkdir("#{OUTPUT_DIR}/images") unless File.directory?("#{OUTPUT_DIR}/images")
-    pdf.root_objects.find_all{|obj| obj.is_a?(Graphics::ImageXObject)}.each do |stream|
-      begin
-        ext, image_data = stream.to_image_file
-        image_file = "#{OUTPUT_DIR}/images/image_#{stream.reference.refno}.#{ext}"
+        pdf.root_objects.find_all{|obj| obj.is_a?(Graphics::ImageXObject)}.each do |stream|
+            begin
+                ext, image_data = stream.to_image_file
+                image_file = File.join(image_dir, "image_#{stream.reference.refno}.#{ext}")
-        if ext != 'png' and stream.ColorSpace == Graphics::Color::Space::DEVICE_CMYK
-          STDERR.puts "Warning: file '#{image_file}' is intended to be viewed in CMYK color space."
-        end
+                if ext != 'png' and stream.ColorSpace == Graphics::Color::Space::DEVICE_CMYK
+                    STDERR.puts "Warning: file '#{image_file}' is intended to be viewed in CMYK color space."
+                end
-        File.open(image_file, "wb") do |fd|
-          fd.write(image_data)
+                File.binwrite(image_file, image_data)
+                nimages += 1
+            rescue
+                STDERR.puts "Unable to decode image (stream #{stream.reference.refno}). #{$!.message}"
+            end
         end
-        nimages += 1
-      rescue Exception => e
-        STDERR.puts "Unable to decode image (stream #{stream.reference.refno}). #{e.message}"
-      end
+        puts "Extracted #{nimages} images to '#{image_dir}'."
     end
-    puts "Extracted #{nimages} images to '#{OUTPUT_DIR}/images'."
-  end
-rescue SystemExit
-rescue Exception => e
-  STDERR.puts "#{e.class}: #{e.message}"
-  exit 1
-end
+rescue
+    abort "#{$!.class}: #{$!.message}"
+end