RubyGems - burner - Versions diffs - 1.3.0 → 1.4.0.pre.alpha - Mend

burner 1.3.0 → 1.4.0.pre.alpha

Files changed (14) hide show

checksums.yaml +4 -4
data/CHANGELOG.md +10 -0
data/README.md +6 -1
data/burner.gemspec +1 -0
data/lib/burner.rb +1 -0
data/lib/burner/jobs.rb +3 -0
data/lib/burner/library.rb +3 -0
data/lib/burner/library/compress/row_reader.rb +102 -0
data/lib/burner/library/io/row_reader.rb +119 -0
data/lib/burner/library/serialize/csv.rb +15 -2
data/lib/burner/modeling.rb +1 -0
data/lib/burner/modeling/byte_order_mark.rb +27 -0
data/lib/burner/version.rb +1 -1
metadata +21 -4

checksums.yaml CHANGED

@@ -1,7 +1,7 @@
 ---
 SHA256:
-  metadata.gz: be4b0f77b37a352fc98dc859e4593750670442f8b9353ef86836749e0b9dee8c
-  data.tar.gz: b5cd388f6886fd3956a33db754fbad454e8d94a68d9920cbdb0f82f40bec9a04
+  metadata.gz: e4694264d232ea9b8c353973096b144283967676421524aa7aa2b9582f73469f
+  data.tar.gz: 1730498b8d7b18a1fee81a51b16817cb17e69f78bcd3091be7152b3139955806
 SHA512:
-  metadata.gz: 942fc77175829d47a2b070d5dbdc7f7bb024e6f3be58254cd3b42ab5e70a64f688dd2d3fcd48aa7b193d349a1b497cdde0a7b2dfd95fd25078b56d59f52d94ad
-  data.tar.gz: dd6e6e5ce6de426c2fbf0e4950adbd3c908f7ed49e2314d242e43538bf90768de5216db34fe940050c02231b2dac6115ded03a29ae415a2c5d591aeb771d49ab
+  metadata.gz: 1c473531a5422691fb36e14f5fbf7d7421fd19abe889d08e84e14265c146616f5761acbc3458c8cdd656ac784755dc96ec68370637234f260dbac16b0b8486b6
+  data.tar.gz: 88bce907acfcbb8fcec5c39d4be5ba8876fb630583ed55b268d96c3eca65c66412d15439f5abe4af8c29505099b54796dd4e9cdcb898a707d5e32a3e4dc0d838

data/CHANGELOG.md CHANGED

@@ -1,3 +1,13 @@
+# 1.4.0 (TBD)
+Additions:
+* byte_order_mark option for b/serialize/csv job
+Added Jobs:
+* b/compress/row_reader
+* b/io/row_reader
 # 1.3.0 (December 11th, 2020)
 Additions:

data/README.md CHANGED

@@ -228,6 +228,10 @@ This library only ships with very basic, rudimentary jobs that are meant to just
 * **b/collection/validate** [invalid_register, join_char, message_key, register, separator, validations]: Take an array of objects, run it through each declared validator, and split the objects into two registers.  The valid objects will be split into the current register while the invalid ones will go into the invalid_register as declared.  Optional arguments, join_char and message_key, help determine the compiled error messages.  The separator option can be utilized to use dot-notation for validating keys.  See each validation's options by viewing their classes within the `lib/modeling/validations` directory.
 * **b/collection/values** [include_keys, register]: Take an array of objects and call `#values` on each object. If include_keys is true (it is false by default), then call `#keys` on the first object and inject that as a "header" object.
+#### Compression
+* **b/compress/row_reader** [data_key, ignore_blank_path, ignore_blank_data, path_key, register, separator]: Iterates over an array of objects, extracts a path and data in each object, and creates a zip file.
 #### De-serialization
 * **b/deserialize/csv** [register]: Take a CSV string and de-serialize into object(s).  Currently it will return an array of arrays, with each nested array representing one row.
@@ -240,11 +244,12 @@ By default all jobs will use the `Burner::Disks::Local` disk for its persistence
 * **b/io/exist** [disk, path, short_circuit]: Check to see if a file exists. The path parameter can be interpolated using `Payload#params`.  If short_circuit was set to true (defaults to false) and the file does not exist then the pipeline will be short-circuited.
 * **b/io/read** [binary, disk, path, register]: Read in a local file.  The path parameter can be interpolated using `Payload#params`.  If the contents are binary, pass in `binary: true` to open it up in binary+read mode.
+* **b/io/row_reader** [data_key, disk, ignore_blank_path, ignore_file_not_found, path_key, register, separator]: Iterates over an array of objects, extracts a filepath from a key in each object, and attempts to load the file's content for each record.  The file's content will be stored at the specified data_key. By default missing paths or files will be treated as hard errors.  If you wish to ignore these then pass in true for ignore_blank_path and/or ignore_file_not_found.
 * **b/io/write** [binary, disk, path, register]: Write to a local file.  The path parameter can be interpolated using `Payload#params`.  If the contents are binary, pass in `binary: true` to open it up in binary+write mode.
 #### Serialization
-* **b/serialize/csv** [register]: Take an array of arrays and create a CSV.
+* **b/serialize/csv** [byte_order_mark, register]: Take an array of arrays and create a CSV.  You can optionally pre-pend a byte order mark, see Burner::Modeling::ByteOrderMark for acceptable options.
 * **b/serialize/json** [register]: Convert value to JSON.
 * **b/serialize/yaml** [register]: Convert value to YAML.

data/burner.gemspec CHANGED

@@ -33,6 +33,7 @@ Gem::Specification.new do |s|
   s.add_dependency('hash_math', '~>1.2')
   s.add_dependency('objectable', '~>1.0')
   s.add_dependency('realize', '~>1.3')
+  s.add_dependency('rubyzip', '~>1.2')
   s.add_dependency('stringento', '~>2.1')
   s.add_development_dependency('guard-rspec', '~>4.7')

data/lib/burner.rb CHANGED

@@ -22,6 +22,7 @@ require 'singleton'
 require 'stringento'
 require 'time'
 require 'yaml'
+require 'zip'
 # Common/Shared
 require_relative 'burner/disks'

data/lib/burner/jobs.rb CHANGED

@@ -35,12 +35,15 @@ module Burner
     register 'b/collection/values',            Library::Collection::Values
     register 'b/collection/validate',          Library::Collection::Validate
+    register 'b/compress/row_reader',          Library::Compress::RowReader
     register 'b/deserialize/csv',              Library::Deserialize::Csv
     register 'b/deserialize/json',             Library::Deserialize::Json
     register 'b/deserialize/yaml',             Library::Deserialize::Yaml
     register 'b/io/exist',                     Library::IO::Exist
     register 'b/io/read',                      Library::IO::Read
+    register 'b/io/row_reader',                Library::IO::RowReader
     register 'b/io/write',                     Library::IO::Write
     register 'b/serialize/csv',                Library::Serialize::Csv

data/lib/burner/library.rb CHANGED

@@ -26,12 +26,15 @@ require_relative 'library/collection/unpivot'
 require_relative 'library/collection/validate'
 require_relative 'library/collection/values'
+require_relative 'library/compress/row_reader'
 require_relative 'library/deserialize/csv'
 require_relative 'library/deserialize/json'
 require_relative 'library/deserialize/yaml'
 require_relative 'library/io/exist'
 require_relative 'library/io/read'
+require_relative 'library/io/row_reader'
 require_relative 'library/io/write'
 require_relative 'library/serialize/csv'

data/lib/burner/library/compress/row_reader.rb ADDED

@@ -0,0 +1,102 @@
+# frozen_string_literal: true
+#
+# Copyright (c) 2020-present, Blue Marble Payroll, LLC
+#
+# This source code is licensed under the MIT license found in the
+# LICENSE file in the root directory of this source tree.
+#
+module Burner
+  module Library
+    module Compress
+      # Iterates over an array of objects, extracts a path and data in each object, and
+      # creates a zip file.  By default, if a path is blank then an ArgumentError will be raised.
+      # If this is undesirable then you can set ignore_blank_path to true and the record will be
+      # skipped.  You also have the option to supress blank files being added by configuring
+      # ignore_blank_data as true.
+      #
+      # Expected Payload[register] input: array of objects.
+      # Payload[register] output: compressed binary zip file contents.
+      class RowReader < JobWithRegister
+        Content = Struct.new(:path, :data)
+        private_constant :Content
+        DEFAULT_DATA_KEY = 'data'
+        DEFAULT_PATH_KEY = 'path'
+        attr_reader :data_key,
+                    :ignore_blank_data,
+                    :ignore_blank_path,
+                    :path_key,
+                    :resolver
+        def initialize(
+          name:,
+          data_key: DEFAULT_DATA_KEY,
+          ignore_blank_data: false,
+          ignore_blank_path: false,
+          path_key: DEFAULT_PATH_KEY,
+          register: DEFAULT_REGISTER,
+          separator: ''
+        )
+          super(name: name, register: register)
+          @data_key          = data_key.to_s
+          @ignore_blank_data = ignore_blank_data || false
+          @ignore_blank_path = ignore_blank_path || false
+          @path_key          = path_key.to_s
+          @resolver          = Objectable.resolver(separator: separator)
+          freeze
+        end
+        def perform(output, payload)
+          payload[register] = Zip::OutputStream.write_buffer do |zip|
+            array(payload[register]).each.with_index(1) do |record, index|
+              content = extract_path_and_data(record, index, output)
+              next unless content
+              zip.put_next_entry(content.path)
+              zip.write(content.data)
+            end
+          end.string
+        end
+        private
+        def extract_path_and_data(record, index, output)
+          path = strip_leading_separator(resolver.get(record, path_key))
+          data = resolver.get(record, data_key)
+          return if assert_and_skip_missing_path?(path, index, output)
+          return if skip_missing_data?(data, index, output)
+          Content.new(path, data)
+        end
+        def strip_leading_separator(path)
+          path.to_s.start_with?(File::SEPARATOR) ? path.to_s[1..-1] : path.to_s
+        end
+        def assert_and_skip_missing_path?(path, index, output)
+          if ignore_blank_path && path.to_s.empty?
+            output.detail("Skipping record #{index} because of blank path")
+            true
+          elsif path.to_s.empty?
+            raise ArgumentError, "Record #{index} is missing a path at key: #{path_key}"
+          end
+        end
+        def skip_missing_data?(data, index, output)
+          return false unless ignore_blank_data && data.to_s.empty?
+          output.detail("Skipping record #{index} because of blank data")
+          true
+        end
+      end
+    end
+  end
+end

data/lib/burner/library/io/row_reader.rb ADDED

@@ -0,0 +1,119 @@
+# frozen_string_literal: true
+#
+# Copyright (c) 2020-present, Blue Marble Payroll, LLC
+#
+# This source code is licensed under the MIT license found in the
+# LICENSE file in the root directory of this source tree.
+#
+require_relative 'open_file_base'
+module Burner
+  module Library
+    module IO
+      # Iterates over an array of objects, extracts a filepath from a key in each object,
+      # and attempts to load the file's content for each record.  The file's content will be
+      # stored at the specified data_key.  By default missing paths or files will be
+      # treated as hard errors.  If you wish to ignore these then pass in true for
+      # ignore_blank_path and/or ignore_file_not_found; ignored records are passed through
+      # without the data_key being set.  The binary option is forwarded to the disk when
+      # each file is read.
+      #
+      # Expected Payload[register] input: array of objects.
+      # Payload[register] output: array of objects.
+      class RowReader < JobWithRegister
+        # Raised when a record's path does not exist on the disk and
+        # ignore_file_not_found is false.
+        class FileNotFoundError < StandardError; end
+        DEFAULT_DATA_KEY = 'data'
+        DEFAULT_PATH_KEY = 'path'
+        attr_reader :binary,
+                    :data_key,
+                    :disk,
+                    :ignore_blank_path,
+                    :ignore_file_not_found,
+                    :path_key,
+                    :resolver
+        def initialize(
+          name:,
+          binary: false,
+          data_key: DEFAULT_DATA_KEY,
+          disk: {},
+          ignore_blank_path: false,
+          ignore_file_not_found: false,
+          path_key: DEFAULT_PATH_KEY,
+          register: DEFAULT_REGISTER,
+          separator: ''
+        )
+          super(name: name, register: register)
+          @binary                = binary || false
+          @data_key              = data_key.to_s
+          @disk                  = Disks.make(disk)
+          @ignore_blank_path     = ignore_blank_path || false
+          @ignore_file_not_found = ignore_file_not_found || false
+          @path_key              = path_key.to_s
+          @resolver              = Objectable.resolver(separator: separator)
+          freeze
+        end
+        # Load file contents into every record and write the records back to the register.
+        def perform(output, payload)
+          records = array(payload[register])
+          # Report the size of the normalized records; the raw register value is only
+          # normalized by array(), so it is not assumed to respond to #length.
+          output.detail("Reading path_key: #{path_key} for #{records.length} record(s)")
+          # The file contents are written to data_key, not path_key.
+          output.detail("Storing read data in: #{data_key}")
+          payload[register] = records.map.with_index(1) do |object, index|
+            load_data(object, index, output)
+          end
+        end
+        private
+        # Truthy when the path is blank and blank paths are ignored.
+        # Raises ArgumentError when the path is blank and blank paths are not ignored.
+        def assert_and_skip_missing_path?(path, index, output)
+          missing_path            = path.to_s.empty?
+          blank_path_raises_error = !ignore_blank_path
+          if missing_path && blank_path_raises_error
+            output.detail("Record #{index} is missing a path, raising error")
+            raise ArgumentError, "Record #{index} is missing a path"
+          elsif missing_path
+            output.detail("Record #{index} is missing a path")
+            true
+          end
+        end
+        # Truthy when the file is absent from the disk and missing files are ignored.
+        # Raises FileNotFoundError when the file is absent and missing files are not ignored.
+        def assert_and_skip_file_not_found?(path, index, output)
+          does_not_exist              = !disk.exist?(path)
+          file_not_found_raises_error = !ignore_file_not_found
+          if file_not_found_raises_error && does_not_exist
+            output.detail("Record #{index} path: '#{path}' does not exist, raising error")
+            raise FileNotFoundError, "#{path} does not exist"
+          elsif does_not_exist
+            output.detail("Record #{index} path: '#{path}' does not exist, skipping")
+            true
+          end
+        end
+        # Reads the file referenced by the record and stores its contents at data_key.
+        # The same object is returned in every case; skipped records are returned unmodified.
+        def load_data(object, index, output)
+          path = resolver.get(object, path_key)
+          return object if assert_and_skip_missing_path?(path, index, output)
+          return object if assert_and_skip_file_not_found?(path, index, output)
+          data = disk.read(path, binary: binary)
+          resolver.set(object, data_key, data)
+          object
+        end
+      end
+    end
+  end
+end

data/lib/burner/library/serialize/csv.rb CHANGED

@@ -10,17 +10,30 @@
 module Burner
   module Library
     module Serialize
-      # Take an array of arrays and create a CSV.
+      # Take an array of arrays and create a CSV.  You can optionally pre-pend a byte order mark,
+      # see Burner::Modeling::ByteOrderMark for acceptable options.
       #
       # Expected Payload[register] input: array of arrays.
       # Payload[register] output: a serialized CSV string.
       class Csv < JobWithRegister
+        attr_reader :byte_order_mark
+        def initialize(name:, byte_order_mark: nil, register: DEFAULT_REGISTER)
+          super(name: name, register: register)
+          @byte_order_mark = Modeling::ByteOrderMark.resolve(byte_order_mark)
+          freeze
+        end
         def perform(_output, payload)
-          payload[register] = CSV.generate(options) do |csv|
+          serialized_rows = CSV.generate(options) do |csv|
             array(payload[register]).each do |row|
               csv << row
             end
           end
+          payload[register] = "#{byte_order_mark}#{serialized_rows}"
         end
         private

data/lib/burner/modeling.rb CHANGED

@@ -9,6 +9,7 @@
 require_relative 'modeling/attribute'
 require_relative 'modeling/attribute_renderer'
+require_relative 'modeling/byte_order_mark'
 require_relative 'modeling/key_index_mapping'
 require_relative 'modeling/key_mapping'
 require_relative 'modeling/validations'

data/lib/burner/modeling/byte_order_mark.rb ADDED

@@ -0,0 +1,27 @@
+# frozen_string_literal: true
+#
+# Copyright (c) 2020-present, Blue Marble Payroll, LLC
+#
+# This source code is licensed under the MIT license found in the
+# LICENSE file in the root directory of this source tree.
+#
+module Burner
+  module Modeling
+    # Define all acceptable byte order mark values.
+    module ByteOrderMark
+      UTF_8    = "\xEF\xBB\xBF"
+      UTF_16BE = "\xFE\xFF"
+      UTF_16LE = "\xFF\xFE"
+      UTF_32BE = "\x00\x00\xFE\xFF"
+      UTF_32LE = "\xFE\xFF\x00\x00"
+      class << self
+        def resolve(value)
+          value ? const_get(value.to_s.upcase.to_sym) : nil
+        end
+      end
+    end
+  end
+end

data/lib/burner/version.rb CHANGED

@@ -8,5 +8,5 @@
 #
 module Burner
-  VERSION = '1.3.0'
+  VERSION = '1.4.0-alpha'
 end

metadata CHANGED

@@ -1,14 +1,14 @@
 --- !ruby/object:Gem::Specification
 name: burner
 version: !ruby/object:Gem::Version
-  version: 1.3.0
+  version: 1.4.0.pre.alpha
 platform: ruby
 authors:
 - Matthew Ruggio
 autorequire:
 bindir: exe
 cert_chain: []
-date: 2020-12-12 00:00:00.000000000 Z
+date: 2020-12-17 00:00:00.000000000 Z
 dependencies:
 - !ruby/object:Gem::Dependency
   name: acts_as_hashable
@@ -80,6 +80,20 @@ dependencies:
     - - "~>"
       - !ruby/object:Gem::Version
         version: '1.3'
+- !ruby/object:Gem::Dependency
+  name: rubyzip
+  requirement: !ruby/object:Gem::Requirement
+    requirements:
+    - - "~>"
+      - !ruby/object:Gem::Version
+        version: '1.2'
+  type: :runtime
+  prerelease: false
+  version_requirements: !ruby/object:Gem::Requirement
+    requirements:
+    - - "~>"
+      - !ruby/object:Gem::Version
+        version: '1.2'
 - !ruby/object:Gem::Dependency
   name: stringento
   requirement: !ruby/object:Gem::Requirement
@@ -238,6 +252,7 @@ files:
 - lib/burner/library/collection/unpivot.rb
 - lib/burner/library/collection/validate.rb
 - lib/burner/library/collection/values.rb
+- lib/burner/library/compress/row_reader.rb
 - lib/burner/library/deserialize/csv.rb
 - lib/burner/library/deserialize/json.rb
 - lib/burner/library/deserialize/yaml.rb
@@ -245,6 +260,7 @@ files:
 - lib/burner/library/io/exist.rb
 - lib/burner/library/io/open_file_base.rb
 - lib/burner/library/io/read.rb
+- lib/burner/library/io/row_reader.rb
 - lib/burner/library/io/write.rb
 - lib/burner/library/nothing.rb
 - lib/burner/library/serialize/csv.rb
@@ -256,6 +272,7 @@ files:
 - lib/burner/modeling.rb
 - lib/burner/modeling/attribute.rb
 - lib/burner/modeling/attribute_renderer.rb
+- lib/burner/modeling/byte_order_mark.rb
 - lib/burner/modeling/key_index_mapping.rb
 - lib/burner/modeling/key_mapping.rb
 - lib/burner/modeling/validations.rb
@@ -292,9 +309,9 @@ required_ruby_version: !ruby/object:Gem::Requirement
       version: '2.5'
 required_rubygems_version: !ruby/object:Gem::Requirement
   requirements:
-  - - ">="
+  - - ">"
     - !ruby/object:Gem::Version
-      version: '0'
+      version: 1.3.1
 requirements: []
 rubygems_version: 3.0.3
 signing_key: