origami 1.2.7 → 2.0.0
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +4 -4
- data/CHANGELOG.md +66 -0
- data/README.md +112 -0
- data/bin/config/pdfcop.conf.yml +232 -233
- data/bin/gui/about.rb +27 -37
- data/bin/gui/config.rb +108 -117
- data/bin/gui/file.rb +416 -365
- data/bin/gui/gtkhex.rb +1138 -1153
- data/bin/gui/hexview.rb +55 -57
- data/bin/gui/imgview.rb +48 -51
- data/bin/gui/menu.rb +388 -386
- data/bin/gui/properties.rb +114 -130
- data/bin/gui/signing.rb +571 -617
- data/bin/gui/textview.rb +77 -95
- data/bin/gui/treeview.rb +382 -387
- data/bin/gui/walker.rb +227 -232
- data/bin/gui/xrefs.rb +56 -60
- data/bin/pdf2pdfa +53 -57
- data/bin/pdf2ruby +212 -228
- data/bin/pdfcop +338 -348
- data/bin/pdfdecompress +58 -65
- data/bin/pdfdecrypt +56 -60
- data/bin/pdfencrypt +75 -80
- data/bin/pdfexplode +185 -182
- data/bin/pdfextract +201 -218
- data/bin/pdfmetadata +83 -82
- data/bin/pdfsh +4 -5
- data/bin/pdfwalker +1 -2
- data/bin/shell/.irbrc +45 -82
- data/bin/shell/console.rb +105 -130
- data/bin/shell/hexdump.rb +40 -64
- data/examples/README.md +34 -0
- data/examples/attachments/attachment.rb +38 -0
- data/examples/attachments/nested_document.rb +51 -0
- data/examples/encryption/encryption.rb +28 -0
- data/{samples/actions/triggerevents/trigger.rb → examples/events/events.rb} +13 -16
- data/examples/flash/flash.rb +37 -0
- data/{samples → examples}/flash/helloworld.swf +0 -0
- data/examples/forms/javascript.rb +54 -0
- data/examples/forms/xfa.rb +115 -0
- data/examples/javascript/hello_world.rb +22 -0
- data/examples/javascript/js_emulation.rb +54 -0
- data/examples/loop/goto.rb +32 -0
- data/examples/loop/named.rb +33 -0
- data/examples/signature/signature.rb +65 -0
- data/examples/uri/javascript.rb +56 -0
- data/examples/uri/open-uri.rb +21 -0
- data/examples/uri/submitform.rb +47 -0
- data/lib/origami.rb +29 -42
- data/lib/origami/3d.rb +350 -225
- data/lib/origami/acroform.rb +262 -288
- data/lib/origami/actions.rb +268 -288
- data/lib/origami/annotations.rb +697 -722
- data/lib/origami/array.rb +258 -184
- data/lib/origami/boolean.rb +74 -84
- data/lib/origami/catalog.rb +397 -434
- data/lib/origami/collections.rb +144 -0
- data/lib/origami/destinations.rb +233 -194
- data/lib/origami/dictionary.rb +253 -232
- data/lib/origami/encryption.rb +1274 -1243
- data/lib/origami/export.rb +232 -268
- data/lib/origami/extensions/fdf.rb +307 -220
- data/lib/origami/extensions/ppklite.rb +368 -435
- data/lib/origami/filespec.rb +197 -0
- data/lib/origami/filters.rb +301 -295
- data/lib/origami/filters/ascii.rb +177 -180
- data/lib/origami/filters/ccitt.rb +528 -535
- data/lib/origami/filters/crypt.rb +26 -35
- data/lib/origami/filters/dct.rb +46 -52
- data/lib/origami/filters/flate.rb +95 -94
- data/lib/origami/filters/jbig2.rb +49 -55
- data/lib/origami/filters/jpx.rb +38 -44
- data/lib/origami/filters/lzw.rb +189 -183
- data/lib/origami/filters/predictors.rb +221 -235
- data/lib/origami/filters/runlength.rb +103 -104
- data/lib/origami/font.rb +173 -186
- data/lib/origami/functions.rb +67 -81
- data/lib/origami/graphics.rb +25 -21
- data/lib/origami/graphics/colors.rb +178 -187
- data/lib/origami/graphics/instruction.rb +79 -85
- data/lib/origami/graphics/path.rb +142 -148
- data/lib/origami/graphics/patterns.rb +160 -167
- data/lib/origami/graphics/render.rb +43 -50
- data/lib/origami/graphics/state.rb +138 -153
- data/lib/origami/graphics/text.rb +188 -205
- data/lib/origami/graphics/xobject.rb +819 -815
- data/lib/origami/header.rb +63 -78
- data/lib/origami/javascript.rb +596 -597
- data/lib/origami/linearization.rb +285 -290
- data/lib/origami/metadata.rb +139 -148
- data/lib/origami/name.rb +112 -148
- data/lib/origami/null.rb +53 -62
- data/lib/origami/numeric.rb +162 -175
- data/lib/origami/obfuscation.rb +186 -174
- data/lib/origami/object.rb +593 -573
- data/lib/origami/outline.rb +42 -47
- data/lib/origami/outputintents.rb +73 -82
- data/lib/origami/page.rb +703 -592
- data/lib/origami/parser.rb +238 -290
- data/lib/origami/parsers/fdf.rb +41 -33
- data/lib/origami/parsers/pdf.rb +75 -95
- data/lib/origami/parsers/pdf/lazy.rb +137 -0
- data/lib/origami/parsers/pdf/linear.rb +64 -66
- data/lib/origami/parsers/ppklite.rb +34 -70
- data/lib/origami/pdf.rb +1030 -1005
- data/lib/origami/reference.rb +102 -102
- data/lib/origami/signature.rb +591 -609
- data/lib/origami/stream.rb +668 -551
- data/lib/origami/string.rb +397 -373
- data/lib/origami/template/patterns.rb +56 -0
- data/lib/origami/template/widgets.rb +151 -0
- data/lib/origami/trailer.rb +144 -158
- data/lib/origami/tree.rb +62 -0
- data/lib/origami/version.rb +23 -0
- data/lib/origami/webcapture.rb +88 -79
- data/lib/origami/xfa.rb +2863 -2882
- data/lib/origami/xreftable.rb +472 -384
- data/test/dataset/calc.pdf +85 -0
- data/test/dataset/crypto.pdf +82 -0
- data/test/dataset/empty.pdf +49 -0
- data/test/test_actions.rb +27 -0
- data/test/test_annotations.rb +90 -0
- data/test/test_pages.rb +31 -0
- data/test/test_pdf.rb +16 -0
- data/test/test_pdf_attachment.rb +34 -0
- data/test/test_pdf_create.rb +24 -0
- data/test/test_pdf_encrypt.rb +95 -0
- data/test/test_pdf_parse.rb +96 -0
- data/test/test_pdf_sign.rb +58 -0
- data/test/test_streams.rb +182 -0
- data/test/test_xrefs.rb +67 -0
- metadata +88 -58
- data/README +0 -67
- data/bin/pdf2graph +0 -121
- data/bin/pdfcocoon +0 -104
- data/lib/origami/file.rb +0 -233
- data/samples/README.txt +0 -45
- data/samples/actions/launch/calc.rb +0 -87
- data/samples/actions/launch/winparams.rb +0 -22
- data/samples/actions/loop/loopgoto.rb +0 -24
- data/samples/actions/loop/loopnamed.rb +0 -21
- data/samples/actions/named/named.rb +0 -31
- data/samples/actions/samba/smbrelay.rb +0 -26
- data/samples/actions/webbug/submitform.js +0 -26
- data/samples/actions/webbug/webbug-browser.rb +0 -68
- data/samples/actions/webbug/webbug-js.rb +0 -67
- data/samples/actions/webbug/webbug-reader.rb +0 -90
- data/samples/attachments/attach.rb +0 -40
- data/samples/attachments/attached.txt +0 -1
- data/samples/crypto/crypto.rb +0 -28
- data/samples/digsig/signed.rb +0 -46
- data/samples/exploits/cve-2008-2992-utilprintf.rb +0 -87
- data/samples/exploits/cve-2009-0927-geticon.rb +0 -65
- data/samples/exploits/exploit_customdictopen.rb +0 -55
- data/samples/exploits/getannots.rb +0 -69
- data/samples/flash/flash.rb +0 -31
- data/samples/javascript/attached.txt +0 -1
- data/samples/javascript/js.rb +0 -52
- data/templates/patterns.rb +0 -66
- data/templates/widgets.rb +0 -173
- data/templates/xdp.rb +0 -92
- data/test/ts_pdf.rb +0 -50
data/lib/origami/parsers/fdf.rb
CHANGED
@@ -1,21 +1,20 @@
|
|
1
1
|
=begin
|
2
2
|
|
3
|
-
|
4
|
-
|
3
|
+
This file is part of Origami, PDF manipulation framework for Ruby
|
4
|
+
Copyright (C) 2016 Guillaume Delugré.
|
5
5
|
|
6
|
-
|
7
|
-
|
8
|
-
|
9
|
-
|
10
|
-
(at your option) any later version.
|
6
|
+
Origami is free software: you can redistribute it and/or modify
|
7
|
+
it under the terms of the GNU Lesser General Public License as published by
|
8
|
+
the Free Software Foundation, either version 3 of the License, or
|
9
|
+
(at your option) any later version.
|
11
10
|
|
12
|
-
|
13
|
-
|
14
|
-
|
15
|
-
|
11
|
+
Origami is distributed in the hope that it will be useful,
|
12
|
+
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
13
|
+
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
14
|
+
GNU Lesser General Public License for more details.
|
16
15
|
|
17
|
-
|
18
|
-
|
16
|
+
You should have received a copy of the GNU Lesser General Public License
|
17
|
+
along with Origami. If not, see <http://www.gnu.org/licenses/>.
|
19
18
|
|
20
19
|
=end
|
21
20
|
|
@@ -23,26 +22,35 @@ require 'origami/parser'
|
|
23
22
|
|
24
23
|
module Origami
|
25
24
|
|
26
|
-
|
27
|
-
|
28
|
-
|
29
|
-
|
30
|
-
|
31
|
-
|
32
|
-
|
33
|
-
|
34
|
-
|
35
|
-
|
36
|
-
|
37
|
-
|
38
|
-
|
39
|
-
|
40
|
-
|
41
|
-
|
25
|
+
class FDF
|
26
|
+
class Parser < Origami::Parser
|
27
|
+
def parse(stream) #:nodoc:
|
28
|
+
super(stream)
|
29
|
+
|
30
|
+
fdf = FDF.new
|
31
|
+
fdf.header = FDF::Header.parse(@data)
|
32
|
+
@options[:callback].call(fdf.header)
|
33
|
+
|
34
|
+
loop do
|
35
|
+
break if (object = parse_object).nil?
|
36
|
+
fdf.insert(object)
|
37
|
+
end
|
38
|
+
|
39
|
+
fdf.revisions.first.xreftable = parse_xreftable
|
40
|
+
fdf.revisions.first.trailer = parse_trailer
|
41
|
+
|
42
|
+
if Origami::OPTIONS[:enable_type_propagation]
|
43
|
+
trailer = fdf.revisions.first.trailer
|
42
44
|
|
43
|
-
|
44
|
-
|
45
|
+
if trailer[:Root].is_a?(Reference)
|
46
|
+
fdf.cast_object(trailer[:Root], FDF::Catalog, self)
|
47
|
+
end
|
48
|
+
|
49
|
+
propagate_types(fdf)
|
50
|
+
end
|
51
|
+
|
52
|
+
fdf
|
53
|
+
end
|
54
|
+
end
|
45
55
|
end
|
46
|
-
end
|
47
56
|
end
|
48
|
-
|
data/lib/origami/parsers/pdf.rb
CHANGED
@@ -1,115 +1,95 @@
|
|
1
1
|
=begin
|
2
2
|
|
3
|
-
|
4
|
-
|
5
|
-
|
6
|
-
|
7
|
-
|
8
|
-
|
9
|
-
|
10
|
-
|
11
|
-
|
12
|
-
|
13
|
-
|
14
|
-
|
15
|
-
|
16
|
-
|
17
|
-
|
18
|
-
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
19
|
-
GNU Lesser General Public License for more details.
|
20
|
-
|
21
|
-
You should have received a copy of the GNU Lesser General Public License
|
22
|
-
along with Origami. If not, see <http://www.gnu.org/licenses/>.
|
3
|
+
This file is part of Origami, PDF manipulation framework for Ruby
|
4
|
+
Copyright (C) 2016 Guillaume Delugré.
|
5
|
+
|
6
|
+
Origami is free software: you can redistribute it and/or modify
|
7
|
+
it under the terms of the GNU Lesser General Public License as published by
|
8
|
+
the Free Software Foundation, either version 3 of the License, or
|
9
|
+
(at your option) any later version.
|
10
|
+
|
11
|
+
Origami is distributed in the hope that it will be useful,
|
12
|
+
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
13
|
+
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
14
|
+
GNU Lesser General Public License for more details.
|
15
|
+
|
16
|
+
You should have received a copy of the GNU Lesser General Public License
|
17
|
+
along with Origami. If not, see <http://www.gnu.org/licenses/>.
|
23
18
|
|
24
19
|
=end
|
25
20
|
|
26
21
|
require 'origami/parser'
|
27
22
|
|
28
23
|
module Origami
|
29
|
-
|
30
|
-
class PDF
|
31
|
-
class Parser < Origami::Parser
|
32
|
-
def initialize(params = {})
|
33
|
-
options =
|
34
|
-
{
|
35
|
-
:password => '', # Default password being tried when opening a protected document.
|
36
|
-
:prompt_password => Proc.new {
|
37
|
-
print "Password: "
|
38
|
-
gets.chomp
|
39
|
-
}, # Callback procedure to prompt password when document is encrypted.
|
40
|
-
:force => false # Force PDF header detection
|
41
|
-
}.update(params)
|
42
|
-
|
43
|
-
super(options)
|
44
|
-
end
|
45
|
-
|
46
|
-
private
|
47
|
-
|
48
|
-
def parse_initialize #:nodoc:
|
49
|
-
if @options[:force] == true
|
50
|
-
@data.skip_until(/%PDF-/).nil?
|
51
|
-
@data.pos = @data.pos - 5
|
52
|
-
end
|
53
24
|
|
54
|
-
|
55
|
-
|
56
|
-
|
57
|
-
|
58
|
-
|
59
|
-
|
60
|
-
|
61
|
-
|
62
|
-
|
63
|
-
|
64
|
-
|
65
|
-
|
66
|
-
|
25
|
+
class PDF
|
26
|
+
class Parser < Origami::Parser
|
27
|
+
def initialize(params = {})
|
28
|
+
options =
|
29
|
+
{
|
30
|
+
password: '', # Default password being tried when opening a protected document.
|
31
|
+
prompt_password: lambda do # Callback procedure to prompt password when document is encrypted.
|
32
|
+
require 'io/console'
|
33
|
+
STDERR.print "Password: "
|
34
|
+
STDIN.noecho(&:gets).chomp
|
35
|
+
end,
|
36
|
+
force: false # Force PDF header detection
|
37
|
+
}.update(params)
|
38
|
+
|
39
|
+
super(options)
|
40
|
+
end
|
67
41
|
|
68
|
-
|
69
|
-
end
|
42
|
+
private
|
70
43
|
|
71
|
-
|
72
|
-
|
44
|
+
def parse_initialize #:nodoc:
|
45
|
+
if @options[:force] == true
|
46
|
+
@data.skip_until(/%PDF-/).nil?
|
47
|
+
@data.pos = @data.pos - 5
|
48
|
+
end
|
73
49
|
|
74
|
-
|
75
|
-
info "...Propagating types..."
|
76
|
-
@deferred_casts.each_pair do |ref, type|
|
77
|
-
type = [ type ] unless type.is_a?(::Array)
|
78
|
-
type.each do |hint|
|
79
|
-
pdf.cast_object(ref, hint)
|
80
|
-
end
|
81
|
-
end
|
82
|
-
end
|
50
|
+
pdf = PDF.new(self)
|
83
51
|
|
84
|
-
|
85
|
-
|
86
|
-
|
87
|
-
|
88
|
-
|
89
|
-
|
90
|
-
|
91
|
-
|
92
|
-
|
93
|
-
|
94
|
-
if passwd.empty?
|
95
|
-
passwd = @options[:prompt_password].call
|
96
|
-
retry unless passwd.empty?
|
52
|
+
info "...Reading header..."
|
53
|
+
begin
|
54
|
+
pdf.header = PDF::Header.parse(@data)
|
55
|
+
@options[:callback].call(pdf.header)
|
56
|
+
rescue InvalidHeaderError
|
57
|
+
raise unless @options[:ignore_errors]
|
58
|
+
warn "PDF header is invalid, ignoring..."
|
59
|
+
end
|
60
|
+
|
61
|
+
pdf
|
97
62
|
end
|
98
63
|
|
99
|
-
|
100
|
-
|
101
|
-
end
|
64
|
+
def parse_finalize(pdf) #:nodoc:
|
65
|
+
warn "This file has been linearized." if pdf.linearized?
|
102
66
|
|
103
|
-
|
104
|
-
warn "This document has been signed!"
|
105
|
-
end
|
67
|
+
propagate_types(pdf) if Origami::OPTIONS[:enable_type_propagation]
|
106
68
|
|
107
|
-
|
108
|
-
|
109
|
-
|
110
|
-
|
69
|
+
#
|
70
|
+
# Decrypt encrypted file contents
|
71
|
+
#
|
72
|
+
if pdf.encrypted?
|
73
|
+
warn "This document contains encrypted data!"
|
111
74
|
|
112
|
-
|
75
|
+
passwd = @options[:password]
|
76
|
+
begin
|
77
|
+
pdf.decrypt(passwd)
|
78
|
+
rescue EncryptionInvalidPasswordError
|
79
|
+
if passwd.empty?
|
80
|
+
passwd = @options[:prompt_password].call
|
81
|
+
retry unless passwd.empty?
|
82
|
+
end
|
113
83
|
|
114
|
-
|
84
|
+
raise
|
85
|
+
end
|
86
|
+
end
|
115
87
|
|
88
|
+
warn "This document has been signed!" if pdf.signed?
|
89
|
+
|
90
|
+
pdf
|
91
|
+
end
|
92
|
+
end
|
93
|
+
end
|
94
|
+
|
95
|
+
end
|
@@ -0,0 +1,137 @@
|
|
1
|
+
=begin
|
2
|
+
|
3
|
+
This file is part of Origami, PDF manipulation framework for Ruby
|
4
|
+
Copyright (C) 2016 Guillaume Delugré.
|
5
|
+
|
6
|
+
Origami is free software: you can redistribute it and/or modify
|
7
|
+
it under the terms of the GNU Lesser General Public License as published by
|
8
|
+
the Free Software Foundation, either version 3 of the License, or
|
9
|
+
(at your option) any later version.
|
10
|
+
|
11
|
+
Origami is distributed in the hope that it will be useful,
|
12
|
+
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
13
|
+
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
14
|
+
GNU Lesser General Public License for more details.
|
15
|
+
|
16
|
+
You should have received a copy of the GNU Lesser General Public License
|
17
|
+
along with Origami. If not, see <http://www.gnu.org/licenses/>.
|
18
|
+
|
19
|
+
=end
|
20
|
+
|
21
|
+
|
22
|
+
require 'origami/parsers/pdf'
|
23
|
+
|
24
|
+
module Origami
|
25
|
+
|
26
|
+
class PDF
|
27
|
+
|
28
|
+
#
|
29
|
+
# Create a new PDF lazy Parser.
|
30
|
+
#
|
31
|
+
class LazyParser < Parser
|
32
|
+
def parse(stream)
|
33
|
+
super
|
34
|
+
|
35
|
+
pdf = parse_initialize
|
36
|
+
revisions = []
|
37
|
+
|
38
|
+
# Set the scanner position at the end.
|
39
|
+
@data.terminate
|
40
|
+
|
41
|
+
# Locate the startxref token.
|
42
|
+
until @data.match?(/#{Trailer::XREF_TOKEN}/)
|
43
|
+
raise ParsingError, "No xref token found" if @data.pos == 0
|
44
|
+
@data.pos -= 1
|
45
|
+
end
|
46
|
+
|
47
|
+
# Extract the offset of the last xref section.
|
48
|
+
trailer = Trailer.parse(@data, self)
|
49
|
+
raise ParsingError, "Cannot locate xref section" if trailer.startxref.zero?
|
50
|
+
|
51
|
+
xref_offset = trailer.startxref
|
52
|
+
while xref_offset and xref_offset != 0
|
53
|
+
|
54
|
+
# Create a new revision based on the xref section offset.
|
55
|
+
revision = parse_revision(pdf, xref_offset)
|
56
|
+
|
57
|
+
# Locate the previous xref section.
|
58
|
+
if revision.xrefstm
|
59
|
+
xref_offset = revision.xrefstm[:Prev].to_i
|
60
|
+
else
|
61
|
+
xref_offset = revision.trailer[:Prev].to_i
|
62
|
+
end
|
63
|
+
|
64
|
+
# Prepend the revision.
|
65
|
+
revisions.unshift(revision)
|
66
|
+
end
|
67
|
+
|
68
|
+
pdf.revisions.clear
|
69
|
+
revisions.each do |rev|
|
70
|
+
pdf.revisions.push(rev)
|
71
|
+
pdf.insert(rev.xrefstm) if rev.has_xrefstm?
|
72
|
+
end
|
73
|
+
|
74
|
+
parse_finalize(pdf)
|
75
|
+
|
76
|
+
pdf
|
77
|
+
end
|
78
|
+
|
79
|
+
private
|
80
|
+
|
81
|
+
def parse_revision(pdf, offset)
|
82
|
+
raise ParsingError, "Invalid xref offset" if offset < 0 or offset >= @data.string.size
|
83
|
+
|
84
|
+
@data.pos = offset
|
85
|
+
|
86
|
+
# Create a new revision.
|
87
|
+
revision = PDF::Revision.new(pdf)
|
88
|
+
|
89
|
+
# Regular xref section.
|
90
|
+
if @data.match?(/#{XRef::Section::TOKEN}/)
|
91
|
+
xreftable = parse_xreftable
|
92
|
+
raise ParsingError, "Cannot parse xref section" if xreftable.nil?
|
93
|
+
|
94
|
+
revision.xreftable = xreftable
|
95
|
+
revision.trailer = parse_trailer
|
96
|
+
|
97
|
+
# Handle hybrid cross-references.
|
98
|
+
if revision.trailer[:XRefStm].is_a?(Integer)
|
99
|
+
begin
|
100
|
+
offset = revision.trailer[:XRefStm].to_i
|
101
|
+
xrefstm = parse_object(offset)
|
102
|
+
|
103
|
+
if xrefstm.is_a?(XRefStream)
|
104
|
+
revision.xrefstm = xrefstm
|
105
|
+
else
|
106
|
+
warn "Invalid xref stream at offset #{offset}"
|
107
|
+
end
|
108
|
+
|
109
|
+
rescue
|
110
|
+
warn "Cannot parse xref stream at offset #{offset}"
|
111
|
+
end
|
112
|
+
end
|
113
|
+
|
114
|
+
# The xrefs are stored in a stream.
|
115
|
+
else
|
116
|
+
xrefstm = parse_object
|
117
|
+
raise ParsingError, "Invalid xref stream" unless xrefstm.is_a?(XRefStream)
|
118
|
+
|
119
|
+
revision.xrefstm = xrefstm
|
120
|
+
|
121
|
+
# Search for the trailer.
|
122
|
+
if @data.skip_until Regexp.union(Trailer::XREF_TOKEN, *Trailer::TOKENS)
|
123
|
+
@data.pos -= @data.matched_size
|
124
|
+
|
125
|
+
revision.trailer = parse_trailer
|
126
|
+
else
|
127
|
+
warn "No trailer found."
|
128
|
+
revision.trailer = Trailer.new
|
129
|
+
end
|
130
|
+
end
|
131
|
+
|
132
|
+
revision
|
133
|
+
end
|
134
|
+
end
|
135
|
+
end
|
136
|
+
|
137
|
+
end
|
@@ -1,85 +1,83 @@
|
|
1
1
|
=begin
|
2
2
|
|
3
|
-
|
4
|
-
|
3
|
+
This file is part of Origami, PDF manipulation framework for Ruby
|
4
|
+
Copyright (C) 2016 Guillaume Delugré.
|
5
5
|
|
6
|
-
|
7
|
-
|
8
|
-
|
9
|
-
|
10
|
-
(at your option) any later version.
|
6
|
+
Origami is free software: you can redistribute it and/or modify
|
7
|
+
it under the terms of the GNU Lesser General Public License as published by
|
8
|
+
the Free Software Foundation, either version 3 of the License, or
|
9
|
+
(at your option) any later version.
|
11
10
|
|
12
|
-
|
13
|
-
|
14
|
-
|
15
|
-
|
11
|
+
Origami is distributed in the hope that it will be useful,
|
12
|
+
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
13
|
+
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
14
|
+
GNU Lesser General Public License for more details.
|
16
15
|
|
17
|
-
|
18
|
-
|
16
|
+
You should have received a copy of the GNU Lesser General Public License
|
17
|
+
along with Origami. If not, see <http://www.gnu.org/licenses/>.
|
19
18
|
|
20
19
|
=end
|
21
20
|
|
22
21
|
|
23
|
-
require 'origami/
|
24
|
-
require 'origami/pdf'
|
22
|
+
require 'origami/parsers/pdf'
|
25
23
|
|
26
24
|
module Origami
|
27
25
|
|
28
|
-
|
29
|
-
|
30
|
-
#
|
31
|
-
# Create a new PDF linear Parser.
|
32
|
-
#
|
33
|
-
class LinearParser < Parser
|
34
|
-
def parse(stream)
|
35
|
-
super
|
36
|
-
|
37
|
-
pdf = parse_initialize
|
26
|
+
class PDF
|
38
27
|
|
39
28
|
#
|
40
|
-
#
|
29
|
+
# Create a new PDF linear Parser.
|
41
30
|
#
|
42
|
-
|
43
|
-
|
44
|
-
|
45
|
-
|
46
|
-
|
47
|
-
|
48
|
-
|
49
|
-
|
50
|
-
|
51
|
-
|
52
|
-
|
31
|
+
class LinearParser < Parser
|
32
|
+
def parse(stream)
|
33
|
+
super
|
34
|
+
|
35
|
+
pdf = parse_initialize
|
36
|
+
|
37
|
+
#
|
38
|
+
# Parse each revision
|
39
|
+
#
|
40
|
+
revision = 0
|
41
|
+
until @data.eos? do
|
42
|
+
begin
|
43
|
+
pdf.add_new_revision unless revision.zero?
|
44
|
+
revision = revision + 1
|
45
|
+
|
46
|
+
info "...Parsing revision #{pdf.revisions.size}..."
|
47
|
+
loop do
|
48
|
+
break if (object = parse_object).nil?
|
49
|
+
pdf.insert(object)
|
50
|
+
end
|
51
|
+
|
52
|
+
pdf.revisions.last.xreftable = parse_xreftable
|
53
|
+
|
54
|
+
trailer = parse_trailer
|
55
|
+
pdf.revisions.last.trailer = trailer
|
56
|
+
|
57
|
+
if trailer.startxref != 0
|
58
|
+
xrefstm = pdf.get_object_by_offset(trailer.startxref)
|
59
|
+
elsif trailer[:XRefStm].is_a?(Integer)
|
60
|
+
xrefstm = pdf.get_object_by_offset(trailer[:XRefStm])
|
61
|
+
end
|
62
|
+
|
63
|
+
if xrefstm.is_a?(XRefStream)
|
64
|
+
warn "Found a XRefStream for this revision at #{xrefstm.reference}"
|
65
|
+
pdf.revisions.last.xrefstm = xrefstm
|
66
|
+
end
|
67
|
+
|
68
|
+
rescue
|
69
|
+
error "Cannot read : " + (@data.peek(10) + "...").inspect
|
70
|
+
error "Stopped on exception : " + $!.message
|
71
|
+
|
72
|
+
break
|
73
|
+
end
|
74
|
+
end
|
75
|
+
|
76
|
+
pdf.loaded!
|
77
|
+
|
78
|
+
parse_finalize(pdf)
|
53
79
|
end
|
54
|
-
|
55
|
-
pdf.revisions.last.xreftable = parse_xreftable
|
56
|
-
|
57
|
-
trailer = parse_trailer
|
58
|
-
pdf.revisions.last.trailer = trailer
|
59
|
-
|
60
|
-
xrefstm = pdf.get_object_by_offset(trailer.startxref) ||
|
61
|
-
(pdf.get_object_by_offset(trailer.XRefStm) if trailer.has_field? :XRefStm)
|
62
|
-
|
63
|
-
if not xrefstm.nil?
|
64
|
-
warn "Found a XRefStream for this revision at #{xrefstm.reference}"
|
65
|
-
pdf.revisions.last.xrefstm = xrefstm
|
66
|
-
end
|
67
|
-
|
68
|
-
rescue SystemExit
|
69
|
-
raise
|
70
|
-
rescue Exception => e
|
71
|
-
error "Cannot read : " + (@data.peek(10) + "...").inspect
|
72
|
-
error "Stopped on exception : " + e.message
|
73
|
-
|
74
|
-
break
|
75
|
-
end
|
76
|
-
|
77
80
|
end
|
78
|
-
|
79
|
-
parse_finalize(pdf)
|
80
|
-
end
|
81
|
-
|
82
81
|
end
|
83
|
-
end
|
84
|
-
end
|
85
82
|
|
83
|
+
end
|