pdf2html 0.0.1 → 0.1.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
checksums.yaml CHANGED
@@ -1,7 +1,7 @@
1
1
  ---
2
2
  SHA1:
3
- metadata.gz: b3da61b55d55cd4bddf89a429c739e2c9f35bd00
4
- data.tar.gz: 7044515d0e576a34f16727e0b67a0fdfe00350e6
3
+ metadata.gz: db52b2d9c2b7944e249ba2716826127b653b16f8
4
+ data.tar.gz: 8fc774e786a47ad21d2d63728787c5bf6a2d6075
5
5
  SHA512:
6
- metadata.gz: f844cc86497e49100d913f50275cddf73cfb3269adbeb470e8f901957db432c41e05fc8a17b3690c08885f46193e2ff2fa65b3aca9ff582bc84a7db38024aaa1
7
- data.tar.gz: b792d10792e0b5b1638f11bc40df31af0c2963f27714ec1025de230b98c5a56c67ebc415ef3eb43f6d0444652e1b3e09324f8df9c056785ca6415f8df18717d1
6
+ metadata.gz: 478baa34fb940efeed097d2a6f9285f1ea0a4eb9fc8aa002938a291258936be40e402f62f07cab2e0a893b19b598ba2d036e296b6c519384ca1ea36e30eb3cfd
7
+ data.tar.gz: 01d5d052a8980aed7475e56825b5a608e6dbc29fee1d14d618f2f23bb2d4c6f22a02e953039507bb5746d1eb5e771777c7f1e57b2cfcfc1c69338d63a2b05bd4
data/README.md CHANGED
@@ -1,6 +1,6 @@
1
1
  # Pdf2html
2
2
 
3
- Ruby interface to [pdf2htmlex](https://github.com/coolwanglu/pdf2htmlEX). Will utilize posix_spawn if available.
3
+ Ruby wrapper for the awesome [pdf2htmlex](https://github.com/coolwanglu/pdf2htmlEX). Will utilize `posix_spawn` if available.
4
4
 
5
5
  ## Installation
6
6
 
@@ -11,17 +11,16 @@ On OS X this is easy using Homebrew:
11
11
 
12
12
  Install the gem:
13
13
 
14
- gem install pdf2html
14
+ $ gem install pdf2html
15
15
 
16
16
  ## Usage
17
17
 
18
- Pdf2Html.convert({
19
- pdf: "/home/dev/meow.pdf",
20
- dest_dir: "/home/dev/precious_html",
21
- zoom: 1.5
22
- })
18
+ ```ruby
19
+ Pdf2Html.convert '/home/dev/meow.pdf', dest_dir: '/home/dev/public/', zoom: 1.5
23
20
 
24
- ### All params to date:
21
+ Pdf2Html.convert '/home/dev/meow.pdf', { dest_dir: '/home/dev/public/', zoom: 1.5 }, "your_awesome_optional_html_filename.html"
22
+ ```
23
+ ### All options to date:
25
24
 
26
25
  data_dir: "--data-dir",
27
26
  first_page: "--first-page",
@@ -64,5 +63,4 @@ Install the gem:
64
63
  debug: "--debug"
65
64
 
66
65
  ## Work harder
67
-
68
-
66
+ Aleksandr Schigol
@@ -2,7 +2,7 @@ require 'pdf2html/version'
2
2
  require 'pdf2html/caller'
3
3
 
4
4
  module Pdf2Html
5
- def self.convert(options = {})
6
- Caller.new(options).run
5
+ def self.convert(input_file, options = {}, output_file = "")
6
+ Caller.new(input_file, options, output_file).run
7
7
  end
8
8
  end
@@ -2,18 +2,37 @@ require 'cocaine'
2
2
  require 'pdf2html/option_provider'
3
3
 
4
4
  module Pdf2Html
5
- PDF2HTMLEX = 'pdf2htmlex'
6
-
7
5
  class Caller
8
6
  attr_reader :line, :cmd_options
7
+ attr_writer :cmd
9
8
 
10
- def initialize(options)
11
- @cmd_options = OptionProvider.new(options)
12
- @line = ::Cocaine::CommandLine.new(PDF2HTMLEX, @cmd_options.to_s)
9
+ def initialize(input_file, options = {}, output_file = "")
10
+ args = { pdf: input_file, html: output_file }
11
+ @cmd_options = OptionProvider.new(args, options)
12
+ @line = ::Cocaine::CommandLine.new(cmd, @cmd_options.to_s)
13
13
  end
14
14
 
15
15
  def run
16
16
  @line.run(@cmd_options.to_h)
17
17
  end
18
+
19
+ def cmd
20
+ @cmd ||= which('pdf2htmlex') || which('pdf2htmlEX')
21
+ end
22
+
23
+ private
24
+
25
+ def which(cmd)
26
+ exts = ENV['PATHEXT'] ? ENV['PATHEXT'].split(';') : ['']
27
+
28
+ ENV['PATH'].split(File::PATH_SEPARATOR).each do |path|
29
+ exts.each do |ext|
30
+ exe = File.join(path, "#{cmd}#{ext}")
31
+ return exe if File.executable? exe
32
+ end
33
+ end
34
+
35
+ return nil
36
+ end
18
37
  end
19
38
  end
@@ -1,9 +1,10 @@
1
1
  module Pdf2Html
2
+ PDF2HTMLEX_ARGS = [":pdf", ":html"]
3
+
2
4
  PDF2HTMLEX_OPTIONS = {
3
5
  zoom: "--zoom",
4
6
  data_dir: "--data-dir",
5
7
  dest_dir: "--dest-dir",
6
- pdf: "",
7
8
  first_page: "--first-page",
8
9
  last_page: "--last-page",
9
10
  fit_width: "--fit-width",
@@ -45,26 +46,23 @@ module Pdf2Html
45
46
  }
46
47
 
47
48
  class OptionProvider
48
- attr_reader :keys#, :switches
49
+ attr_reader :keys
49
50
 
50
- def initialize(options = {})
51
+ def initialize(args, options = {})
51
52
  @keys = PDF2HTMLEX_OPTIONS.keys & options.keys
52
53
  @options = normalize_options(options)
54
+ @args = args
53
55
  end
54
56
 
55
57
  def to_s
56
58
  return "" if @keys.empty?
57
59
 
58
- @options_string ||= ""
59
- @options.each do |key, val|
60
- @options_string = @options_string + "#{PDF2HTMLEX_OPTIONS[key]} #{key.to_sym.inspect.to_s} "
61
- end
62
-
63
- @options_string
60
+ (array_from_options(@options, PDF2HTMLEX_OPTIONS) +
61
+ PDF2HTMLEX_ARGS).join(" ")
64
62
  end
65
63
 
66
64
  def to_h
67
- @options
65
+ @options.merge(@args)
68
66
  end
69
67
 
70
68
  private
@@ -77,5 +75,11 @@ module Pdf2Html
77
75
  hash
78
76
  end
79
77
  end
78
+
79
+ def array_from_options(hash, opts = hash)
80
+ hash.flat_map do |key, val|
81
+ [opts[key].to_s, key.to_sym.inspect.to_s]
82
+ end
83
+ end
80
84
  end
81
85
  end
@@ -1,3 +1,3 @@
1
1
  module Pdf2Html
2
- VERSION = '0.0.1'
2
+ VERSION = '0.1.0'
3
3
  end
@@ -2,8 +2,9 @@ require_relative '../../test/helper'
2
2
 
3
3
  describe Pdf2Html::OptionProvider do
4
4
  before do
5
- @options = { zoom: 1.5, dest_dir: "/dir", pdf: "some.pdf", nonsense: "nonsense" }
6
- @option_provider = Pdf2Html::OptionProvider.new(@options)
5
+ @options = { zoom: 1.5, dest_dir: "/dir", nonsense: "nonsense" }
6
+ @args = { pdf: "some.pdf", html: 'some.html' }
7
+ @option_provider = Pdf2Html::OptionProvider.new(@args, @options)
7
8
  end
8
9
 
9
10
  it "must include only valid options" do
@@ -17,4 +18,8 @@ describe Pdf2Html::OptionProvider do
17
18
  it "must output options string for cocaine" do
18
19
  @option_provider.to_s.class.must_equal String
19
20
  end
21
+
22
+ # describe ".to_h" do
23
+ # it ""
24
+ # end
20
25
  end
metadata CHANGED
@@ -1,14 +1,14 @@
1
1
  --- !ruby/object:Gem::Specification
2
2
  name: pdf2html
3
3
  version: !ruby/object:Gem::Version
4
- version: 0.0.1
4
+ version: 0.1.0
5
5
  platform: ruby
6
6
  authors:
7
7
  - Aleksandr Schigol
8
8
  autorequire:
9
9
  bindir: bin
10
10
  cert_chain: []
11
- date: 2013-11-19 00:00:00.000000000 Z
11
+ date: 2013-12-12 00:00:00.000000000 Z
12
12
  dependencies:
13
13
  - !ruby/object:Gem::Dependency
14
14
  name: cocaine