docsplit 0.4.0 → 0.4.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (3)
  1. data/docsplit.gemspec +1 -1
  2. data/lib/docsplit.rb +4 -2
  3. metadata +3 -3
@@ -1,6 +1,6 @@
1
1
  Gem::Specification.new do |s|
2
2
  s.name = 'docsplit'
3
- s.version = '0.4.0' # Keep version in sync with docsplit.rb
3
+ s.version = '0.4.1' # Keep version in sync with docsplit.rb
4
4
  s.date = '2010-8-23'
5
5
 
6
6
  s.homepage = "http://documentcloud.github.com/docsplit/"
@@ -1,7 +1,7 @@
1
1
  # The Docsplit module delegates to the Java PDF extractors.
2
2
  module Docsplit
3
3
 
4
- VERSION = '0.4.0' # Keep in sync with gemspec.
4
+ VERSION = '0.4.1' # Keep in sync with gemspec.
5
5
 
6
6
  ROOT = File.expand_path(File.dirname(__FILE__) + '/..')
7
7
 
@@ -11,6 +11,8 @@ module Docsplit
11
11
 
12
12
  HEADLESS = "-Djava.awt.headless=true"
13
13
 
14
+ OFFICE = RUBY_PLATFORM.match(/darwin/i) ? '' : '-Doffice.home=/usr/lib/openoffice'
15
+
14
16
  METADATA_KEYS = [:author, :date, :creator, :keywords, :producer, :subject, :title, :length]
15
17
 
16
18
  DEPENDENCIES = {:java => false, :gm => false, :pdftotext => false, :pdftk => false, :tesseract => false}
@@ -76,7 +78,7 @@ module Docsplit
76
78
  # Runs a Java command, with quieted logging, and the classpath set properly.
77
79
  def self.run(command, pdfs, opts, return_output=false)
78
80
  pdfs = [pdfs].flatten.map{|pdf| "\"#{pdf}\""}.join(' ')
79
- cmd = "java #{HEADLESS} #{LOGGING} -cp #{CLASSPATH} #{command} #{pdfs} 2>&1"
81
+ cmd = "java #{HEADLESS} #{LOGGING} #{OFFICE} -cp #{CLASSPATH} #{command} #{pdfs} 2>&1"
80
82
  result = `#{cmd}`.chomp
81
83
  raise ExtractionFailed, result if $? != 0
82
84
  return return_output ? (result.empty? ? nil : result) : true
metadata CHANGED
@@ -1,13 +1,13 @@
1
1
  --- !ruby/object:Gem::Specification
2
2
  name: docsplit
3
3
  version: !ruby/object:Gem::Version
4
- hash: 15
4
+ hash: 13
5
5
  prerelease: false
6
6
  segments:
7
7
  - 0
8
8
  - 4
9
- - 0
10
- version: 0.4.0
9
+ - 1
10
+ version: 0.4.1
11
11
  platform: ruby
12
12
  authors:
13
13
  - Jeremy Ashkenas