libis-format 1.2.9 → 2.0.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/.coveralls.yml +2 -0
- data/.gitignore +20 -0
- data/.travis.yml +70 -0
- data/Gemfile +0 -8
- data/README.md +2 -2
- data/Rakefile +8 -0
- data/base/Dockerfile +35 -0
- data/base/Dockerfile.alpine +20 -0
- data/base/Dockerfile.rvm +56 -0
- data/base/rework_path +20 -0
- data/data/PDFA_def.ps +3 -3
- data/data/eciRGB_v2.icc +0 -0
- data/data/types.yml +3 -16
- data/docker_cfg.yml +1 -0
- data/lib/libis/format/cli/convert.rb +4 -4
- data/lib/libis/format/cli/prompt_helper.rb +24 -32
- data/lib/libis/format/config.rb +4 -3
- data/lib/libis/format/converter/audio_converter.rb +31 -56
- data/lib/libis/format/converter/base.rb +21 -8
- data/lib/libis/format/converter/chain.rb +6 -18
- data/lib/libis/format/converter/fop_pdf_converter.rb +2 -0
- data/lib/libis/format/converter/image_assembler.rb +82 -0
- data/lib/libis/format/converter/image_converter.rb +21 -141
- data/lib/libis/format/converter/image_splitter.rb +80 -0
- data/lib/libis/format/converter/image_watermarker.rb +261 -0
- data/lib/libis/format/converter/jp2_converter.rb +4 -4
- data/lib/libis/format/converter/office_converter.rb +5 -3
- data/lib/libis/format/converter/pdf_assembler.rb +66 -0
- data/lib/libis/format/converter/pdf_converter.rb +31 -98
- data/lib/libis/format/converter/pdf_optimizer.rb +70 -0
- data/lib/libis/format/converter/pdf_splitter.rb +65 -0
- data/lib/libis/format/converter/pdf_watermarker.rb +110 -0
- data/lib/libis/format/converter/spreadsheet_converter.rb +5 -3
- data/lib/libis/format/converter/video_converter.rb +3 -6
- data/lib/libis/format/converter/xslt_converter.rb +14 -15
- data/lib/libis/format/identifier.rb +4 -4
- data/lib/libis/format/info.rb +27 -0
- data/lib/libis/format/library.rb +147 -0
- data/lib/libis/format/tool/extension_identification.rb +26 -24
- data/lib/libis/format/tool/{ff_mpeg.rb → ffmpeg.rb} +1 -10
- data/lib/libis/format/tool/fido.rb +27 -22
- data/lib/libis/format/tool/file_tool.rb +24 -11
- data/lib/libis/format/tool/fop_pdf.rb +14 -25
- data/lib/libis/format/tool/identification_tool.rb +40 -38
- data/lib/libis/format/tool/office_to_pdf.rb +18 -30
- data/lib/libis/format/tool/pdf_copy.rb +1 -11
- data/lib/libis/format/tool/pdf_merge.rb +1 -11
- data/lib/libis/format/tool/pdf_optimizer.rb +2 -11
- data/lib/libis/format/tool/pdf_split.rb +16 -25
- data/lib/libis/format/tool/pdf_to_pdfa.rb +32 -50
- data/lib/libis/format/tool/pdfa_validator.rb +30 -25
- data/lib/libis/format/tool/spreadsheet_to_ods.rb +2 -10
- data/lib/libis/format/tool.rb +1 -2
- data/lib/libis/format/version.rb +1 -3
- data/lib/libis/format/yaml_loader.rb +71 -0
- data/lib/libis/format.rb +5 -2
- data/libis-format.gemspec +18 -24
- metadata +78 -120
- data/data/AdobeRGB1998.icc +0 -0
- data/lib/libis/format/converter/email_converter.rb +0 -38
- data/lib/libis/format/tool/msg_to_pdf.rb +0 -270
- data/lib/libis/format/type_database.rb +0 -133
- data/lib/libis/format/type_database_impl.rb +0 -120
- data/tools/pdf2pdfa +0 -395
- /data/bin/{droid_tool → droid} +0 -0
- /data/bin/{fido_tool → fido} +0 -0
| @@ -0,0 +1,70 @@ | |
| 1 | 
            +
            # encoding: utf-8
         | 
| 2 | 
            +
             | 
| 3 | 
            +
            require_relative 'base'
         | 
| 4 | 
            +
             | 
| 5 | 
            +
            require 'libis/tools/extend/hash'
         | 
| 6 | 
            +
            require 'libis/format/tool/pdf_copy'
         | 
| 7 | 
            +
            require 'libis/format/tool/pdf_to_pdfa'
         | 
| 8 | 
            +
            require 'libis/format/tool/pdf_optimizer'
         | 
| 9 | 
            +
             | 
| 10 | 
            +
            module Libis
         | 
| 11 | 
            +
              module Format
         | 
| 12 | 
            +
                module Converter
         | 
| 13 | 
            +
             | 
| 14 | 
            +
                  class PdfOptimizer < Libis::Format::Converter::Base
         | 
| 15 | 
            +
             | 
| 16 | 
            +
                    def self.input_types
         | 
| 17 | 
            +
                      [:PDF]
         | 
| 18 | 
            +
                    end
         | 
| 19 | 
            +
             | 
| 20 | 
            +
                    def self.output_types(format = nil)
         | 
| 21 | 
            +
                      return [] unless input_types.include?(format) if format
         | 
| 22 | 
            +
                      [:PDF]
         | 
| 23 | 
            +
                    end
         | 
| 24 | 
            +
             | 
| 25 | 
            +
                    def pdf_optimize(_)
         | 
| 26 | 
            +
                      #force usage of this converter
         | 
| 27 | 
            +
                    end
         | 
| 28 | 
            +
             | 
| 29 | 
            +
                    # Optimize the PDF
         | 
| 30 | 
            +
                    #
         | 
| 31 | 
            +
                    # This reduces the graphics quality to a level in order to limit file size. This option relies on the
         | 
| 32 | 
            +
                    # presence of ghostscript and takes one argument: the quality level. It should be one of:
         | 
| 33 | 
            +
                    #
         | 
| 34 | 
            +
                    # - 0 : lowest quality (Acrobat Distiller 'Screen Optimized' equivalent)
         | 
| 35 | 
            +
                    # - 1 : medium quality (Acrobat Distiller 'eBook' equivalent)
         | 
| 36 | 
            +
                    # - 2 : good quality
         | 
| 37 | 
            +
                    # - 3 : high quality (Acrobat Distiller 'Print Optimized' equivalent)
         | 
| 38 | 
            +
                    # - 4 : highest quality (Acrobat Distiller 'Prepress Optimized' equivalent)
         | 
| 39 | 
            +
                    #
         | 
| 40 | 
            +
                    # Note that the optimization is intended to be used with PDF's containing high-resolution images.
         | 
| 41 | 
            +
                    #
         | 
| 42 | 
            +
                    # @param [Integer] setting quality setting. [0-4]
         | 
| 43 | 
            +
                    def quality(setting = 1)
         | 
| 44 | 
            +
                      @quality = %w(screen ebook default printer prepress)[setting] if (0..4) === setting
         | 
| 45 | 
            +
                    end
         | 
| 46 | 
            +
             | 
| 47 | 
            +
                    def convert(source, target, format, opts = {})
         | 
| 48 | 
            +
                      super
         | 
| 49 | 
            +
             | 
| 50 | 
            +
                       optimize_pdf(source, target, @quality || 'ebook')
         | 
| 51 | 
            +
             | 
| 52 | 
            +
                    end
         | 
| 53 | 
            +
             | 
| 54 | 
            +
                    def optimize_pdf(source, target, quality)
         | 
| 55 | 
            +
             | 
| 56 | 
            +
                      using_temp(target) do |tmpname|
         | 
| 57 | 
            +
                        result = Libis::Format::Tool::PdfOptimizer.run(source, tmpname, quality)
         | 
| 58 | 
            +
                        unless result[:status] == 0
         | 
| 59 | 
            +
                          error("Pdf optimization encountered errors:\n%s", (result[:err] + result[:out]).join("\n"))
         | 
| 60 | 
            +
                          next nil
         | 
| 61 | 
            +
                        end
         | 
| 62 | 
            +
                        tmpname
         | 
| 63 | 
            +
                      end
         | 
| 64 | 
            +
                    end
         | 
| 65 | 
            +
             | 
| 66 | 
            +
                  end
         | 
| 67 | 
            +
             | 
| 68 | 
            +
                end
         | 
| 69 | 
            +
              end
         | 
| 70 | 
            +
            end
         | 
| @@ -0,0 +1,65 @@ | |
| 1 | 
            +
            # encoding: utf-8
         | 
| 2 | 
            +
             | 
| 3 | 
            +
            require_relative 'base'
         | 
| 4 | 
            +
             | 
| 5 | 
            +
            require 'libis/format/tool/pdf_split'
         | 
| 6 | 
            +
             | 
| 7 | 
            +
            module Libis
         | 
| 8 | 
            +
              module Format
         | 
| 9 | 
            +
                module Converter
         | 
| 10 | 
            +
             | 
| 11 | 
            +
                  # noinspection DuplicatedCode
         | 
| 12 | 
            +
                  class PdfSplitter < Libis::Format::Converter::Base
         | 
| 13 | 
            +
             | 
| 14 | 
            +
                    def self.input_types
         | 
| 15 | 
            +
                      [:PDF]
         | 
| 16 | 
            +
                    end
         | 
| 17 | 
            +
             | 
| 18 | 
            +
                    def self.output_types(format = nil)
         | 
| 19 | 
            +
                      return [] unless input_types.include?(format) if format
         | 
| 20 | 
            +
                      [:PDF]
         | 
| 21 | 
            +
                    end
         | 
| 22 | 
            +
             | 
| 23 | 
            +
                    def pdf_split(_)
         | 
| 24 | 
            +
                      #force usage of this converter
         | 
| 25 | 
            +
                    end
         | 
| 26 | 
            +
             | 
| 27 | 
            +
                    def self.category
         | 
| 28 | 
            +
                      :splitter
         | 
| 29 | 
            +
                    end
         | 
| 30 | 
            +
             | 
| 31 | 
            +
                    # Split at given page. If omitted or nil, the source PDF will be split at every page
         | 
| 32 | 
            +
                    def page(v)
         | 
| 33 | 
            +
                      @page = v unless v.blank
         | 
| 34 | 
            +
                    end
         | 
| 35 | 
            +
             | 
| 36 | 
            +
                    def convert(source, target, format, opts = {})
         | 
| 37 | 
            +
                      super
         | 
| 38 | 
            +
             | 
| 39 | 
            +
                      result = split(source, target)
         | 
| 40 | 
            +
                      return nil unless result
         | 
| 41 | 
            +
             | 
| 42 | 
            +
                      result
         | 
| 43 | 
            +
                    end
         | 
| 44 | 
            +
             | 
| 45 | 
            +
                    private
         | 
| 46 | 
            +
             | 
| 47 | 
            +
                    def split(source, target)
         | 
| 48 | 
            +
             | 
| 49 | 
            +
                      options = @page ? ['--page', @page] : ['--every_page']
         | 
| 50 | 
            +
                      using_temp(target) do |tmpname|
         | 
| 51 | 
            +
                        result = Libis::Format::Tool::PdfSplit.run(source, tmpname, *options)
         | 
| 52 | 
            +
                        unless result[:err].empty?
         | 
| 53 | 
            +
                          error("Pdf split encountered errors:\n%s", result[:err].join(join("\n")))
         | 
| 54 | 
            +
                          next nil
         | 
| 55 | 
            +
                        end
         | 
| 56 | 
            +
                        tmpname
         | 
| 57 | 
            +
                      end
         | 
| 58 | 
            +
             | 
| 59 | 
            +
                    end
         | 
| 60 | 
            +
             | 
| 61 | 
            +
                  end
         | 
| 62 | 
            +
             | 
| 63 | 
            +
                end
         | 
| 64 | 
            +
              end
         | 
| 65 | 
            +
            end
         | 
| @@ -0,0 +1,110 @@ | |
| 1 | 
            +
            # encoding: utf-8
         | 
| 2 | 
            +
             | 
| 3 | 
            +
            require_relative 'base'
         | 
| 4 | 
            +
             | 
| 5 | 
            +
            require 'libis/tools/extend/hash'
         | 
| 6 | 
            +
            require 'libis/format/tool/pdf_copy'
         | 
| 7 | 
            +
            require 'libis/format/tool/pdf_to_pdfa'
         | 
| 8 | 
            +
            require 'libis/format/tool/pdf_optimizer'
         | 
| 9 | 
            +
             | 
| 10 | 
            +
            module Libis
         | 
| 11 | 
            +
              module Format
         | 
| 12 | 
            +
                module Converter
         | 
| 13 | 
            +
             | 
| 14 | 
            +
                  class PdfWatermarker < Libis::Format::Converter::Base
         | 
| 15 | 
            +
             | 
| 16 | 
            +
                    def self.input_types
         | 
| 17 | 
            +
                      [:PDF]
         | 
| 18 | 
            +
                    end
         | 
| 19 | 
            +
             | 
| 20 | 
            +
                    def self.output_types(format = nil)
         | 
| 21 | 
            +
                      return [] unless input_types.include?(format) if format
         | 
| 22 | 
            +
                      [:PDF]
         | 
| 23 | 
            +
                    end
         | 
| 24 | 
            +
             | 
| 25 | 
            +
                    def pdf_watermark(_)
         | 
| 26 | 
            +
                      #force usage of this converter
         | 
| 27 | 
            +
                    end
         | 
| 28 | 
            +
             | 
| 29 | 
            +
                    def initialize
         | 
| 30 | 
            +
                      super
         | 
| 31 | 
            +
                      @options[:text] = '© LIBIS'
         | 
| 32 | 
            +
                      @options[:opacity] = '0.3'
         | 
| 33 | 
            +
                    end
         | 
| 34 | 
            +
             | 
| 35 | 
            +
                    def file(v)
         | 
| 36 | 
            +
                      @options[:file] = v.blank? ? nil : v
         | 
| 37 | 
            +
                    end
         | 
| 38 | 
            +
             | 
| 39 | 
            +
                    def text(v)
         | 
| 40 | 
            +
                      @options[:text] = v
         | 
| 41 | 
            +
                    end
         | 
| 42 | 
            +
             | 
| 43 | 
            +
                    def rotation(v)
         | 
| 44 | 
            +
                      @options[:rotation] = v unless v.blank?
         | 
| 45 | 
            +
                    end
         | 
| 46 | 
            +
             | 
| 47 | 
            +
                    def size(v)
         | 
| 48 | 
            +
                      @options[:size] = v unless v.blank?
         | 
| 49 | 
            +
                    end
         | 
| 50 | 
            +
             | 
| 51 | 
            +
                    def opacity(v)
         | 
| 52 | 
            +
                      @options[:opacity] = v unless v.blank?
         | 
| 53 | 
            +
                    end
         | 
| 54 | 
            +
             | 
| 55 | 
            +
                    def gap_size(v)
         | 
| 56 | 
            +
                      @options[:gap_size] = v
         | 
| 57 | 
            +
                    end
         | 
| 58 | 
            +
             | 
| 59 | 
            +
                    def gap_ratio(v)
         | 
| 60 | 
            +
                      @options[:gap_ratio] = v
         | 
| 61 | 
            +
                    end
         | 
| 62 | 
            +
             | 
| 63 | 
            +
                    def convert(source, target, format, opts = {})
         | 
| 64 | 
            +
                      super
         | 
| 65 | 
            +
             | 
| 66 | 
            +
                      result = convert_pdf(source, target)
         | 
| 67 | 
            +
                      return nil unless result
         | 
| 68 | 
            +
             | 
| 69 | 
            +
                      result
         | 
| 70 | 
            +
             | 
| 71 | 
            +
                    end
         | 
| 72 | 
            +
             | 
| 73 | 
            +
                    OPTIONS_TABLE = {
         | 
| 74 | 
            +
                        file: 'wm_image',
         | 
| 75 | 
            +
                        text: 'wm_text',
         | 
| 76 | 
            +
                        rotation: 'wm_text_rotation',
         | 
| 77 | 
            +
                        size: 'wm_font_size',
         | 
| 78 | 
            +
                        opacity: 'wm_opacity',
         | 
| 79 | 
            +
                        gap_size: 'wm_gap_size',
         | 
| 80 | 
            +
                        gap_ratio: 'wm_gap_ratio'
         | 
| 81 | 
            +
                    }
         | 
| 82 | 
            +
                    # noinspection DuplicatedCode
         | 
| 83 | 
            +
                    def convert_pdf(source, target)
         | 
| 84 | 
            +
             | 
| 85 | 
            +
                      using_temp(target) do |tmpname|
         | 
| 86 | 
            +
                        result = Libis::Format::Tool::PdfCopy.run(
         | 
| 87 | 
            +
                            source, tmpname,
         | 
| 88 | 
            +
                            @options.map {|k, v|
         | 
| 89 | 
            +
                              if v.nil?
         | 
| 90 | 
            +
                                nil
         | 
| 91 | 
            +
                              else
         | 
| 92 | 
            +
                                v = v.split('\n') unless v.blank? if k == :text
         | 
| 93 | 
            +
                                k = OPTIONS_TABLE[k] || k
         | 
| 94 | 
            +
                                ["--#{k}", (v.is_a?(Array) ? v : v.to_s)]
         | 
| 95 | 
            +
                              end}.compact.flatten
         | 
| 96 | 
            +
                        )
         | 
| 97 | 
            +
                        unless result[:err].empty?
         | 
| 98 | 
            +
                          error("Pdf conversion encountered errors:\n%s", result[:err].join(join("\n")))
         | 
| 99 | 
            +
                          next nil
         | 
| 100 | 
            +
                        end
         | 
| 101 | 
            +
                        tmpname
         | 
| 102 | 
            +
                      end
         | 
| 103 | 
            +
             | 
| 104 | 
            +
                    end
         | 
| 105 | 
            +
             | 
| 106 | 
            +
                  end
         | 
| 107 | 
            +
             | 
| 108 | 
            +
                end
         | 
| 109 | 
            +
              end
         | 
| 110 | 
            +
            end
         | 
| @@ -3,7 +3,7 @@ | |
| 3 3 | 
             
            require_relative 'base'
         | 
| 4 4 |  | 
| 5 5 | 
             
            require 'libis/format/tool/spreadsheet_to_ods'
         | 
| 6 | 
            -
            require 'libis/format/ | 
| 6 | 
            +
            require 'libis/format/library'
         | 
| 7 7 |  | 
| 8 8 | 
             
            module Libis
         | 
| 9 9 | 
             
              module Format
         | 
| @@ -20,7 +20,7 @@ module Libis | |
| 20 20 | 
             
                    end
         | 
| 21 21 |  | 
| 22 22 | 
             
                    def self.output_types(format = nil)
         | 
| 23 | 
            -
                      return [] unless input_types.include?(format)
         | 
| 23 | 
            +
                      return [] unless input_types.include?(format) if format
         | 
| 24 24 | 
             
                      [:OO_CALC]
         | 
| 25 25 | 
             
                    end
         | 
| 26 26 |  | 
| @@ -31,7 +31,9 @@ module Libis | |
| 31 31 | 
             
                    def convert(source, target, format, opts = {})
         | 
| 32 32 | 
             
                      super
         | 
| 33 33 |  | 
| 34 | 
            -
                      Format::Tool::SpreadsheetToOds.run(source, target)
         | 
| 34 | 
            +
                      return nil unless Format::Tool::SpreadsheetToOds.run(source, target)
         | 
| 35 | 
            +
             | 
| 36 | 
            +
                      target
         | 
| 35 37 |  | 
| 36 38 | 
             
                    end
         | 
| 37 39 |  | 
| @@ -1,5 +1,5 @@ | |
| 1 1 | 
             
            require_relative 'base'
         | 
| 2 | 
            -
            require 'libis/format/tool/ | 
| 2 | 
            +
            require 'libis/format/tool/ffmpeg'
         | 
| 3 3 |  | 
| 4 4 | 
             
            require 'fileutils'
         | 
| 5 5 |  | 
| @@ -14,7 +14,7 @@ module Libis | |
| 14 14 | 
             
                    end
         | 
| 15 15 |  | 
| 16 16 | 
             
                    def self.output_types(format = nil)
         | 
| 17 | 
            -
                      return [] unless input_types.include?(format)
         | 
| 17 | 
            +
                      return [] unless input_types.include?(format) if format
         | 
| 18 18 | 
             
                      [:GIF, :WEBM, :MP4, :MPG, :MKV, :MJP2, :QTFF, :AVI, :OGGV, :WMV, :DV, :FLV, :SWF]
         | 
| 19 19 | 
             
                    end
         | 
| 20 20 |  | 
| @@ -179,10 +179,7 @@ module Libis | |
| 179 179 |  | 
| 180 180 | 
             
                      end
         | 
| 181 181 |  | 
| 182 | 
            -
                       | 
| 183 | 
            -
                        files: [target],
         | 
| 184 | 
            -
                        converter: self.class.name
         | 
| 185 | 
            -
                      }
         | 
| 182 | 
            +
                      target
         | 
| 186 183 |  | 
| 187 184 | 
             
                    end
         | 
| 188 185 |  | 
| @@ -1,17 +1,17 @@ | |
| 1 | 
            -
            require_relative  | 
| 1 | 
            +
            require_relative 'base'
         | 
| 2 2 |  | 
| 3 3 | 
             
            module Libis
         | 
| 4 4 | 
             
              module Format
         | 
| 5 5 | 
             
                module Converter
         | 
| 6 | 
            +
             | 
| 6 7 | 
             
                  class XsltConverter < Libis::Format::Converter::Base
         | 
| 8 | 
            +
             | 
| 7 9 | 
             
                    def self.input_types
         | 
| 8 10 | 
             
                      [:XML]
         | 
| 9 11 | 
             
                    end
         | 
| 10 12 |  | 
| 11 13 | 
             
                    def self.output_types(format = nil)
         | 
| 12 | 
            -
                      if format
         | 
| 13 | 
            -
                        return [] unless input_types.include?(format)
         | 
| 14 | 
            -
                      end
         | 
| 14 | 
            +
                      return [] unless input_types.include?(format) if format
         | 
| 15 15 | 
             
                      [:XML, :HTML, :TXT]
         | 
| 16 16 | 
             
                    end
         | 
| 17 17 |  | 
| @@ -28,20 +28,20 @@ module Libis | |
| 28 28 | 
             
                      end
         | 
| 29 29 |  | 
| 30 30 | 
             
                      unless @options[:xsl_file]
         | 
| 31 | 
            -
                        error  | 
| 31 | 
            +
                        error 'No xsl_file supplied'
         | 
| 32 32 | 
             
                        return nil
         | 
| 33 33 | 
             
                      end
         | 
| 34 34 |  | 
| 35 35 | 
             
                      FileUtils.mkpath(File.dirname(target))
         | 
| 36 36 |  | 
| 37 37 | 
             
                      if RUBY_PLATFORM == "java"
         | 
| 38 | 
            -
                        require  | 
| 38 | 
            +
                        require 'saxon-xslt'
         | 
| 39 39 | 
             
                        xsl = Saxon.XSLT(File.open(@options[:xsl_file]))
         | 
| 40 40 | 
             
                        xml = Saxon.XML(File.open(source))
         | 
| 41 41 | 
             
                        result = xsl.transform(xml)
         | 
| 42 | 
            -
                        File. | 
| 42 | 
            +
                        File.open(target, 'w') {|f| f.write(result.to_s)}
         | 
| 43 43 | 
             
                      else
         | 
| 44 | 
            -
                        require  | 
| 44 | 
            +
                        require 'nokogiri'
         | 
| 45 45 |  | 
| 46 46 | 
             
                        doc = nil
         | 
| 47 47 | 
             
                        begin
         | 
| @@ -65,7 +65,7 @@ module Libis | |
| 65 65 | 
             
                        xsl = nil
         | 
| 66 66 |  | 
| 67 67 | 
             
                        begin
         | 
| 68 | 
            -
                          fp = File.open(file,  | 
| 68 | 
            +
                          fp = File.open(file, 'r')
         | 
| 69 69 | 
             
                          xsl = Nokogiri::XSLT(fp) do |config|
         | 
| 70 70 | 
             
                            config.options = Nokogiri::XML::ParseOptions::STRICT | Nokogiri::XML::ParseOptions::NOBLANKS
         | 
| 71 71 | 
             
                          end
         | 
| @@ -80,7 +80,7 @@ module Libis | |
| 80 80 |  | 
| 81 81 | 
             
                        begin
         | 
| 82 82 | 
             
                          target_xml = xsl.transform(doc)
         | 
| 83 | 
            -
                          fp = File.open(target,  | 
| 83 | 
            +
                          fp = File.open(target, 'w')
         | 
| 84 84 | 
             
                          fp.write(target_xml)
         | 
| 85 85 | 
             
                        rescue Exception => e
         | 
| 86 86 | 
             
                          error "Error transforming '#{source}' with '#{file}': #{e.message} @ #{e.backtrace[0]}"
         | 
| @@ -89,14 +89,13 @@ module Libis | |
| 89 89 | 
             
                          fp.close unless fp.nil? or fp.closed?
         | 
| 90 90 | 
             
                        end
         | 
| 91 91 |  | 
| 92 | 
            -
                         | 
| 93 | 
            -
                          command: {status: 0},
         | 
| 94 | 
            -
                          files: [target]
         | 
| 95 | 
            -
                        }
         | 
| 96 | 
            -
             | 
| 92 | 
            +
                        target
         | 
| 97 93 | 
             
                      end
         | 
| 94 | 
            +
             | 
| 98 95 | 
             
                    end
         | 
| 96 | 
            +
             | 
| 99 97 | 
             
                  end
         | 
| 98 | 
            +
             | 
| 100 99 | 
             
                end
         | 
| 101 100 | 
             
              end
         | 
| 102 101 | 
             
            end
         | 
| @@ -9,7 +9,7 @@ require 'libis/tools/extend/string' | |
| 9 9 | 
             
            require 'libis/tools/extend/empty'
         | 
| 10 10 | 
             
            require 'nori/core_ext/object'
         | 
| 11 11 |  | 
| 12 | 
            -
            require 'libis/format/ | 
| 12 | 
            +
            require 'libis/format/library'
         | 
| 13 13 |  | 
| 14 14 | 
             
            require_relative 'config'
         | 
| 15 15 | 
             
            require_relative 'tool/fido'
         | 
| @@ -97,7 +97,7 @@ module Libis | |
| 97 97 | 
             
                  end
         | 
| 98 98 |  | 
| 99 99 | 
             
                  def get_fido_identification(file, result, options)
         | 
| 100 | 
            -
                    output = ::Libis::Format::Tool::Fido.run(file, options[:recursive],  | 
| 100 | 
            +
                    output = ::Libis::Format::Tool::Fido.run(file, options[:recursive], options[:fido_options])
         | 
| 101 101 | 
             
                    process_tool_output(output, result, options[:base_dir])
         | 
| 102 102 | 
             
                    output
         | 
| 103 103 | 
             
                  end
         | 
| @@ -132,7 +132,7 @@ module Libis | |
| 132 132 | 
             
                        if doc.validates_against?(xsd_file)
         | 
| 133 133 | 
             
                          log_msg result, :debug, "XML file validated against XML Schema: #{xsd_file}"
         | 
| 134 134 | 
             
                          info = {mimetype: mime, tool_raw: file_result[:tool], tool: :xsd_validation, match_type: 'xsd_validation', format_version: '', }
         | 
| 135 | 
            -
                          file_result.merge! Libis::Format:: | 
| 135 | 
            +
                          file_result.merge! Libis::Format::Library.enrich(info, puid: :puid, mimetype: :mimetype, name: :format_name)
         | 
| 136 136 | 
             
                        end
         | 
| 137 137 | 
             
                      rescue => e
         | 
| 138 138 | 
             
                        # Do nothing - probably Nokogiri chrashed during validation. Could have many causes
         | 
| @@ -208,7 +208,7 @@ module Libis | |
| 208 208 | 
             
                  end
         | 
| 209 209 |  | 
| 210 210 | 
             
                  def get_mimetype(puid)
         | 
| 211 | 
            -
                    ::Libis::Format:: | 
| 211 | 
            +
                    ::Libis::Format::Library.get_field_by(:puid, puid, :mimetypes)
         | 
| 212 212 | 
             
                  end
         | 
| 213 213 |  | 
| 214 214 | 
             
                  def get_best_result(results)
         | 
| @@ -0,0 +1,27 @@ | |
| 1 | 
            +
            module Libis
         | 
| 2 | 
            +
              module Format
         | 
| 3 | 
            +
                class Info
         | 
| 4 | 
            +
                  attr_reader :name, :category, :description, :puids, :mimetypes, :extensions
         | 
| 5 | 
            +
             | 
| 6 | 
            +
                  def initialize(name:, category:, description: '', puids: [], mimetypes: [], extensions: [])
         | 
| 7 | 
            +
                    @name = name
         | 
| 8 | 
            +
                    @category = category
         | 
| 9 | 
            +
                    @description = description
         | 
| 10 | 
            +
                    @puids = puids
         | 
| 11 | 
            +
                    @mimetypes = mimetypes
         | 
| 12 | 
            +
                    @extensions = extensions
         | 
| 13 | 
            +
                  end
         | 
| 14 | 
            +
             | 
| 15 | 
            +
                  def to_hash
         | 
| 16 | 
            +
                    {
         | 
| 17 | 
            +
                        name: name,
         | 
| 18 | 
            +
                        description: description.dup,
         | 
| 19 | 
            +
                        category: category,
         | 
| 20 | 
            +
                        puids: puids.dup,
         | 
| 21 | 
            +
                        mimetypes: mimetypes.dup,
         | 
| 22 | 
            +
                        extensions: extensions.dup
         | 
| 23 | 
            +
                    }
         | 
| 24 | 
            +
                  end
         | 
| 25 | 
            +
                end
         | 
| 26 | 
            +
              end
         | 
| 27 | 
            +
            end
         | 
| @@ -0,0 +1,147 @@ | |
| 1 | 
            +
            # froze_string_litteral: true
         | 
| 2 | 
            +
            # coding: utf-8
         | 
| 3 | 
            +
            require 'singleton'
         | 
| 4 | 
            +
             | 
| 5 | 
            +
            module Libis
         | 
| 6 | 
            +
              module Format
         | 
| 7 | 
            +
             | 
| 8 | 
            +
                class Library
         | 
| 9 | 
            +
                  include Singleton
         | 
| 10 | 
            +
             | 
| 11 | 
            +
                  class << self
         | 
| 12 | 
            +
                    def implementation=(impl)
         | 
| 13 | 
            +
                      instance.implementation = impl
         | 
| 14 | 
            +
                    end
         | 
| 15 | 
            +
             | 
| 16 | 
            +
                    def get_info(format)
         | 
| 17 | 
            +
                      instance.get_info(format)
         | 
| 18 | 
            +
                    end
         | 
| 19 | 
            +
             | 
| 20 | 
            +
                    def get_info_by(key, value)
         | 
| 21 | 
            +
                      instance.get_info_by(key, value)
         | 
| 22 | 
            +
                    end
         | 
| 23 | 
            +
             | 
| 24 | 
            +
                    def get_infos_by(key, value)
         | 
| 25 | 
            +
                      instance.get_infos_by(key, value)
         | 
| 26 | 
            +
                    end
         | 
| 27 | 
            +
             | 
| 28 | 
            +
                    def get_field(format, field)
         | 
| 29 | 
            +
                      instance.get_field(format, field)
         | 
| 30 | 
            +
                    end
         | 
| 31 | 
            +
             | 
| 32 | 
            +
                    def get_field_by(key, value, field)
         | 
| 33 | 
            +
                      instance.get_field_by(key, value, field)
         | 
| 34 | 
            +
                    end
         | 
| 35 | 
            +
             | 
| 36 | 
            +
                    def get_fields_by(key, value, field)
         | 
| 37 | 
            +
                      instance.get_fields_by(key, value, field)
         | 
| 38 | 
            +
                    end
         | 
| 39 | 
            +
             | 
| 40 | 
            +
                    def known?(key, value)
         | 
| 41 | 
            +
                      instance.known?(key, value)
         | 
| 42 | 
            +
                    end
         | 
| 43 | 
            +
             | 
| 44 | 
            +
                    def enrich(info, map_keys = {})
         | 
| 45 | 
            +
                      instance.enrich(info, map_keys)
         | 
| 46 | 
            +
                    end
         | 
| 47 | 
            +
             | 
| 48 | 
            +
                    def normalize(info, map_keys = {})
         | 
| 49 | 
            +
                      instance.normalize(info, map_keys)
         | 
| 50 | 
            +
                    end
         | 
| 51 | 
            +
                  end
         | 
| 52 | 
            +
             | 
| 53 | 
            +
                  def implementation=(impl)
         | 
| 54 | 
            +
                    @implementation = impl
         | 
| 55 | 
            +
                  end
         | 
| 56 | 
            +
             | 
| 57 | 
            +
                  def get_field(format, field)
         | 
| 58 | 
            +
                    get_field_by(:name, format, field)
         | 
| 59 | 
            +
                  end
         | 
| 60 | 
            +
             | 
| 61 | 
            +
                  def get_field_by(key, value, field)
         | 
| 62 | 
            +
                    info = get_info_by(key, value)
         | 
| 63 | 
            +
                    return nil unless info
         | 
| 64 | 
            +
                    case field
         | 
| 65 | 
            +
                    when :mimetype
         | 
| 66 | 
            +
                      info[:mimetypes]&.first
         | 
| 67 | 
            +
                    when :puid
         | 
| 68 | 
            +
                      info[:puids]&.first
         | 
| 69 | 
            +
                    when :extension
         | 
| 70 | 
            +
                      info[:extensions]&.first
         | 
| 71 | 
            +
                    else
         | 
| 72 | 
            +
                      info[field]
         | 
| 73 | 
            +
                    end
         | 
| 74 | 
            +
                  end
         | 
| 75 | 
            +
             | 
| 76 | 
            +
                  def get_fields_by(key, value, field)
         | 
| 77 | 
            +
                    get_infos_by(key, value)&.map { |info| info[field] }.compact
         | 
| 78 | 
            +
                  end
         | 
| 79 | 
            +
             | 
| 80 | 
            +
                  def get_info(format)
         | 
| 81 | 
            +
                    get_info_by(:name, format)
         | 
| 82 | 
            +
                  end
         | 
| 83 | 
            +
             | 
| 84 | 
            +
                  def get_info_by(key, value)
         | 
| 85 | 
            +
                    get_infos_by(key, value)&.first
         | 
| 86 | 
            +
                  end
         | 
| 87 | 
            +
             | 
| 88 | 
            +
                  def get_infos_by(key, value)
         | 
| 89 | 
            +
                    result = @implementation.query(key, value)
         | 
| 90 | 
            +
                    result.map(&:to_hash)
         | 
| 91 | 
            +
                  end
         | 
| 92 | 
            +
             | 
| 93 | 
            +
                  def known?(key, value)
         | 
| 94 | 
            +
                    !get_info_by(key, value).nil?
         | 
| 95 | 
            +
                  end
         | 
| 96 | 
            +
             | 
| 97 | 
            +
                  def enrich(info, map_keys = {})
         | 
| 98 | 
            +
                    info = normalize(info, map_keys)
         | 
| 99 | 
            +
                    mapper = Hash.new { |hash, key| hash[key] = key }.merge(map_keys)
         | 
| 100 | 
            +
                    unless (format = info[mapper[:name]]).nil?
         | 
| 101 | 
            +
                      lib_info = get_info(format)
         | 
| 102 | 
            +
                      mapper.keys.each do |key|
         | 
| 103 | 
            +
                        case key
         | 
| 104 | 
            +
                        when :mimetype
         | 
| 105 | 
            +
                          info[mapper[key]] = lib_info[:mimetypes].first if lib_info[:mimetypes].first
         | 
| 106 | 
            +
                        when :puid
         | 
| 107 | 
            +
                          info[mapper[key]] = lib_info[:puids].first if lib_info[:puids].first
         | 
| 108 | 
            +
                        when :extension
         | 
| 109 | 
            +
                          info[mapper[key]] = lib_info[:extensions].first if lib_info[:extensions].first
         | 
| 110 | 
            +
                        else
         | 
| 111 | 
            +
                          info[mapper[key]] = lib_info[key] if lib_info[key]
         | 
| 112 | 
            +
                        end
         | 
| 113 | 
            +
                      end
         | 
| 114 | 
            +
                    end
         | 
| 115 | 
            +
                    info
         | 
| 116 | 
            +
                  end
         | 
| 117 | 
            +
             | 
| 118 | 
            +
                  # Derive name from the available info
         | 
| 119 | 
            +
                  def normalize(info, map_keys = {})
         | 
| 120 | 
            +
                    return {} unless info.is_a? Hash
         | 
| 121 | 
            +
                    mapper = Hash.new { |hash, key| hash[key] = key }.merge(map_keys)
         | 
| 122 | 
            +
                    # fill format from looking up by puid
         | 
| 123 | 
            +
                    unless (puid = info[mapper[:puid]]).blank?
         | 
| 124 | 
            +
                      info[mapper[:name]] ||= get_field_by(:puid, puid, :name)
         | 
| 125 | 
            +
                    end
         | 
| 126 | 
            +
                    # fill format from looking up by mimetype
         | 
| 127 | 
            +
                    unless (mime = info[mapper[:mimetype]]).blank?
         | 
| 128 | 
            +
                      info[mapper[:name]] ||= get_field_by(:mimetype, mime, :name)
         | 
| 129 | 
            +
                    end
         | 
| 130 | 
            +
                    # finally complete the information from looking up by format name
         | 
| 131 | 
            +
                    unless (format = info[mapper[:name]]).nil?
         | 
| 132 | 
            +
                      info[mapper[:mimetype]] = get_field(format, :mimetype)
         | 
| 133 | 
            +
                      info[mapper[:category]] = get_field(format, :category)
         | 
| 134 | 
            +
                    end
         | 
| 135 | 
            +
                    info
         | 
| 136 | 
            +
                  end
         | 
| 137 | 
            +
             | 
| 138 | 
            +
                  private
         | 
| 139 | 
            +
             | 
| 140 | 
            +
                  def initialize
         | 
| 141 | 
            +
                    @implementation = eval(Libis::Format::Config[:format_library_implementation])
         | 
| 142 | 
            +
                  end
         | 
| 143 | 
            +
             | 
| 144 | 
            +
                end
         | 
| 145 | 
            +
             | 
| 146 | 
            +
              end
         | 
| 147 | 
            +
            end
         | 
| @@ -1,56 +1,58 @@ | |
| 1 | 
            -
            # frozen_string_literal: true
         | 
| 2 | 
            -
             | 
| 3 1 | 
             
            require_relative 'identification_tool'
         | 
| 4 2 |  | 
| 5 3 | 
             
            module Libis
         | 
| 6 4 | 
             
              module Format
         | 
| 7 5 | 
             
                module Tool
         | 
| 6 | 
            +
             | 
| 8 7 | 
             
                  class ExtensionIdentification < Libis::Format::Tool::IdentificationTool
         | 
| 9 | 
            -
             | 
| 8 | 
            +
             | 
| 9 | 
            +
                    def run_list(filelist, _options = {})
         | 
| 10 | 
            +
             | 
| 10 11 | 
             
                      output = runner(nil, filelist)
         | 
| 11 12 |  | 
| 12 13 | 
             
                      process_output(output)
         | 
| 14 | 
            +
             | 
| 13 15 | 
             
                    end
         | 
| 14 16 |  | 
| 15 | 
            -
                    def run_dir(dir, recursive = true,  | 
| 17 | 
            +
                    def run_dir(dir, recursive = true, _options = {})
         | 
| 18 | 
            +
             | 
| 16 19 | 
             
                      filelist = find_files(dir, recursive)
         | 
| 17 20 |  | 
| 18 21 | 
             
                      output = runner(nil, filelist)
         | 
| 19 22 |  | 
| 20 23 | 
             
                      process_output(output)
         | 
| 24 | 
            +
             | 
| 21 25 | 
             
                    end
         | 
| 22 26 |  | 
| 23 | 
            -
                    def run(file,  | 
| 27 | 
            +
                    def run(file, _options)
         | 
| 28 | 
            +
             | 
| 24 29 | 
             
                      output = runner(file)
         | 
| 25 30 |  | 
| 26 31 | 
             
                      process_output(output)
         | 
| 32 | 
            +
             | 
| 27 33 | 
             
                    end
         | 
| 28 34 |  | 
| 29 35 | 
             
                    protected
         | 
| 30 36 |  | 
| 31 37 | 
             
                    def runner(*args)
         | 
| 38 | 
            +
             | 
| 32 39 | 
             
                      args.map do |file|
         | 
| 33 | 
            -
                        info = ::Libis::Format:: | 
| 34 | 
            -
                         | 
| 35 | 
            -
             | 
| 36 | 
            -
             | 
| 37 | 
            -
             | 
| 38 | 
            -
             | 
| 39 | 
            -
             | 
| 40 | 
            -
             | 
| 41 | 
            -
             | 
| 42 | 
            -
             | 
| 43 | 
            -
                          puid: begin
         | 
| 44 | 
            -
                            info[:PUID].first
         | 
| 45 | 
            -
                          rescue StandardError
         | 
| 46 | 
            -
                            nil
         | 
| 47 | 
            -
                          end,
         | 
| 48 | 
            -
                          matchtype: 'extension',
         | 
| 49 | 
            -
                          tool: :type_database
         | 
| 50 | 
            -
                        }
         | 
| 40 | 
            +
                        info = ::Libis::Format::Library.get_info_by(:extension, File.extname(file))
         | 
| 41 | 
            +
                        if info
         | 
| 42 | 
            +
                          {
         | 
| 43 | 
            +
                              filepath: file,
         | 
| 44 | 
            +
                              mimetype: (info[:mimetypes].first rescue nil),
         | 
| 45 | 
            +
                              puid: (info[:puids].first rescue nil),
         | 
| 46 | 
            +
                              matchtype: 'extension',
         | 
| 47 | 
            +
                              tool: :format_library
         | 
| 48 | 
            +
                          }
         | 
| 49 | 
            +
                        end
         | 
| 51 50 | 
             
                      end.cleanup
         | 
| 51 | 
            +
             | 
| 52 52 | 
             
                    end
         | 
| 53 | 
            +
             | 
| 53 54 | 
             
                  end
         | 
| 55 | 
            +
             | 
| 54 56 | 
             
                end
         | 
| 55 57 | 
             
              end
         | 
| 56 | 
            -
            end
         | 
| 58 | 
            +
            end
         | 
| @@ -13,11 +13,6 @@ module Libis | |
| 13 13 | 
             
                    include Singleton
         | 
| 14 14 | 
             
                    include ::Libis::Tools::Logger
         | 
| 15 15 |  | 
| 16 | 
            -
                    def self.installed?
         | 
| 17 | 
            -
                      result = Libis::Tools::Command.run(Libis::Format::Config[:ffmpeg_cmd], "-h")
         | 
| 18 | 
            -
                      result[:status] == 0
         | 
| 19 | 
            -
                    end
         | 
| 20 | 
            -
             | 
| 21 16 | 
             
                    def self.run(source, target, options = {})
         | 
| 22 17 | 
             
                      self.instance.run source, target, options
         | 
| 23 18 | 
             
                    end
         | 
| @@ -43,11 +38,7 @@ module Libis | |
| 43 38 |  | 
| 44 39 | 
             
                      warn "FFMpeg warnings: #{(result[:err] + result[:out]).join("\n")}" unless result[:err].empty?
         | 
| 45 40 |  | 
| 46 | 
            -
                       | 
| 47 | 
            -
                        command: result,
         | 
| 48 | 
            -
                        files: [ target ]
         | 
| 49 | 
            -
                      }
         | 
| 50 | 
            -
             | 
| 41 | 
            +
                      result[:out]
         | 
| 51 42 | 
             
                    end
         | 
| 52 43 |  | 
| 53 44 | 
             
                  end
         |