RubyGems - format_parser - Versions diffs - 0.13.5 → 0.13.6 - Mend

format_parser 0.13.5 → 0.13.6

This diff shows the changes between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the package versions as they appear in their respective public registries.

Files changed (5) hide show

checksums.yaml +4 -4
data/CHANGELOG.md +4 -0
data/lib/format_parser/version.rb +1 -1
data/lib/parsers/moov_parser/decoder.rb +32 -23
metadata +1 -1

checksums.yaml CHANGED Viewed

@@ -1,7 +1,7 @@
 ---
 SHA256:
-  metadata.gz: 8837741d44c95c25f1b68ae19991bf6b1c1819b17f8a645d5c53a9d9ba97a8bb
-  data.tar.gz: 58dac9d742cf2b59bbf05ae8b810b8a6b15b144035ca625a52e4a9fbed74f93e
+  metadata.gz: 236f35fe657e5bb8f51cf08724fb3138f17b6a20605af4131a7643711f43cd93
+  data.tar.gz: 65037da607c406be2bf0d8e7eb549537199a4ed8c97243c68b63c62e20bdb9e5
 SHA512:
-  metadata.gz: 5be5537ea121c3eff8ec4520d049b1ff0e813f22cc4ea800ad01be7ccb823e0580ea3155d9d561b6854e1f211a98ecd23e6a8de4ef4c2a735b81a6b69a7aa780
-  data.tar.gz: 9b056ff9cb825a4d925a03ad3fcb245e0e93545057a1cf7c3ef778f84955b16b12175c9d8f3c0ab2e04542364c8bb1c5f65e8c0ad39ff70e199774217282a087
+  metadata.gz: aaa8a5c25a9b9b6884e0ec22adf90390aa2a32e4268e7e1d01c98a5d88a20bb25a4635ca53fd891d28bae8de34287ff57c943af76c905425f41ade98985408d9
+  data.tar.gz: 54a417ead7b3d12d585f6775feee2295d95f40fe9ac66a7a5e0788dfd6791271d95ddc1ef230a7c3e17c04635765916090db2a0cf98a722e5c7d662f80eb7d37

data/CHANGELOG.md CHANGED Viewed

@@ -1,3 +1,7 @@
+## 0.13.6
+* Make all reads in the MOOV decoder strict - fail early if reads are improperly sized
+* Disable parsing for `udta` atoms in MP4/MOV since we do not have a good way of parsing them yet
 ## 0.13.5
 * Use the same TIFF parsing flow for CR2 files as it seems we are not very reliable _yet._ The CR2 parser will need some work.

data/lib/format_parser/version.rb CHANGED Viewed

@@ -1,3 +1,3 @@
 module FormatParser
-  VERSION = '0.13.5'
+  VERSION = '0.13.6'
 end

data/lib/parsers/moov_parser/decoder.rb CHANGED Viewed

@@ -2,6 +2,8 @@
 # read atoms and parse their data fields if applicable. Also contains
 # a few utility functions for finding atoms in a list etc.
 class FormatParser::MOOVParser::Decoder
+  include FormatParser::IOUtils
   class Atom < Struct.new(:at, :atom_size, :atom_type, :path, :children, :atom_fields)
     def to_s
       '%s (%s): %d bytes at offset %d' % [atom_type, path.join('.'), atom_size, at]
@@ -18,11 +20,13 @@ class FormatParser::MOOVParser::Decoder
     end
   end
-  # Atoms (boxes) that are known to only contain children, no data fields
-  KNOWN_BRANCH_ATOM_TYPES = %w(moov mdia trak clip edts minf dinf stbl udta meta)
+  # Atoms (boxes) that are known to only contain children, no data fields.
+  # Avoid including udta or udta.meta here since we do not have methods
+  # for dealing with them yet.
+  KNOWN_BRANCH_ATOM_TYPES = %w(moov mdia trak clip edts minf dinf stbl)
-  # Atoms (boxes) that are known to contain both leaves and data fields
-  KNOWN_BRANCH_AND_LEAF_ATOM_TYPES = %w(meta) # the udta.meta thing used by iTunes
+  # Mark that udta may contain both
+  KNOWN_BRANCH_AND_LEAF_ATOM_TYPES = [] # %w(udta) # the udta.meta thing used by iTunes
   # Limit how many atoms we scan in sequence, to prevent derailments
   MAX_ATOMS_AT_LEVEL = 128
@@ -169,16 +173,24 @@ class FormatParser::MOOVParser::Decoder
   def parse_hdlr_atom(io, atom_size)
     sub_io = StringIO.new(io.read(atom_size - 8))
-    {
-      version: read_byte_value(sub_io),
+    version = read_byte_value(sub_io)
+    base_fields = {
+      version: version,
       flags: read_bytes(sub_io, 3),
       component_type: read_bytes(sub_io, 4),
       component_subtype: read_bytes(sub_io, 4),
       component_manufacturer: read_bytes(sub_io, 4),
-      component_flags: read_bytes(sub_io, 4),
-      component_flags_mask: read_bytes(sub_io, 4),
-      component_name: sub_io.read,
     }
+    if version == 1
+      version1_fields = {
+        component_flags: read_bytes(sub_io, 4),
+        component_flags_mask: read_bytes(sub_io, 4),
+        component_name: sub_io.read,
+      }
+      base_fields.merge(version1_fields)
+    else
+      base_fields
+    end
   end
   def parse_meta_atom(io, atom_size)
@@ -217,11 +229,8 @@ class FormatParser::MOOVParser::Decoder
       # If atom_size is specified to be 1, it is larger than what fits into the
       # 4 bytes and we need to read it right after the atom type
       atom_size = read_64bit_uint(io) if atom_size == 1
-      # We are allowed to read what comes after
-      # the atom size and atom type, but not any more than that
-      size_of_atom_type_and_size = io.pos - atom_pos
-      atom_size_sans_header = atom_size - size_of_atom_type_and_size
+      atom_header_size = io.pos - atom_pos
+      atom_size_sans_header = atom_size - atom_header_size
       children, fields = if KNOWN_BRANCH_AND_LEAF_ATOM_TYPES.include?(atom_type)
         parse_atom_children_and_data_fields(io, atom_size_sans_header, atom_type, current_branch)
@@ -239,39 +248,39 @@ class FormatParser::MOOVParser::Decoder
   end
   def read_16bit_fixed_point(io)
-    _whole, _fraction = io.read(2).unpack('CC')
+    _whole, _fraction = safe_read(io, 2).unpack('CC')
   end
   def read_32bit_fixed_point(io)
-    _whole, _fraction = io.read(4).unpack('nn')
+    _whole, _fraction = safe_read(io, 4).unpack('nn')
   end
   def read_chars(io, n)
-    io.read(n)
+    safe_read(io, n)
   end
   def read_byte_value(io)
-    io.read(1).unpack('C').first
+    safe_read(io, 1).unpack('C').first
   end
   def read_bytes(io, n)
-    io.read(n)
+    safe_read(io, n)
   end
   def read_16bit_uint(io)
-    io.read(2).unpack('n').first
+    safe_read(io, 2).unpack('n').first
   end
   def read_32bit_uint(io)
-    io.read(4).unpack('N').first
+    safe_read(io, 4).unpack('N').first
   end
   def read_64bit_uint(io)
-    io.read(8).unpack('Q>').first
+    safe_read(io, 8).unpack('Q>').first
   end
   def read_binary_coded_decimal(io)
-    bcd_string = io.read(4)
+    bcd_string = safe_read(io, 4)
     [bcd_string].pack('H*').unpack('C*')
   end
 end

metadata CHANGED Viewed

@@ -1,7 +1,7 @@
 --- !ruby/object:Gem::Specification
 name: format_parser
 version: !ruby/object:Gem::Version
-  version: 0.13.5
+  version: 0.13.6
 platform: ruby
 authors:
 - Noah Berman