RubyGems - ecosystems-bibliothecary - Versions diffs - 14.2.0 → 15.0.0 - Mend

ecosystems-bibliothecary 14.2.0 → 15.0.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (72) hide show

checksums.yaml +4 -4
data/CHANGELOG.md +48 -0
data/README.md +9 -24
data/bibliothecary.gemspec +5 -9
data/lib/bibliothecary/analyser/analysis.rb +10 -5
data/lib/bibliothecary/analyser/matchers.rb +7 -5
data/lib/bibliothecary/analyser.rb +0 -30
data/lib/bibliothecary/cli.rb +35 -26
data/lib/bibliothecary/configuration.rb +1 -6
data/lib/bibliothecary/dependency.rb +1 -4
data/lib/bibliothecary/file_info.rb +7 -0
data/lib/bibliothecary/parsers/bentoml.rb +0 -2
data/lib/bibliothecary/parsers/bower.rb +0 -1
data/lib/bibliothecary/parsers/cargo.rb +12 -10
data/lib/bibliothecary/parsers/carthage.rb +51 -15
data/lib/bibliothecary/parsers/clojars.rb +14 -18
data/lib/bibliothecary/parsers/cocoapods.rb +100 -19
data/lib/bibliothecary/parsers/cog.rb +0 -2
data/lib/bibliothecary/parsers/conan.rb +156 -0
data/lib/bibliothecary/parsers/conda.rb +0 -3
data/lib/bibliothecary/parsers/cpan.rb +0 -2
data/lib/bibliothecary/parsers/cran.rb +40 -19
data/lib/bibliothecary/parsers/docker.rb +0 -2
data/lib/bibliothecary/parsers/dub.rb +33 -8
data/lib/bibliothecary/parsers/dvc.rb +0 -2
data/lib/bibliothecary/parsers/elm.rb +13 -3
data/lib/bibliothecary/parsers/go.rb +14 -5
data/lib/bibliothecary/parsers/hackage.rb +132 -24
data/lib/bibliothecary/parsers/haxelib.rb +14 -4
data/lib/bibliothecary/parsers/hex.rb +37 -20
data/lib/bibliothecary/parsers/homebrew.rb +0 -2
data/lib/bibliothecary/parsers/julia.rb +0 -2
data/lib/bibliothecary/parsers/maven.rb +35 -25
data/lib/bibliothecary/parsers/meteor.rb +14 -4
data/lib/bibliothecary/parsers/mlflow.rb +0 -2
data/lib/bibliothecary/parsers/npm.rb +47 -59
data/lib/bibliothecary/parsers/nuget.rb +23 -22
data/lib/bibliothecary/parsers/ollama.rb +0 -2
data/lib/bibliothecary/parsers/packagist.rb +0 -3
data/lib/bibliothecary/parsers/pub.rb +0 -2
data/lib/bibliothecary/parsers/pypi.rb +54 -35
data/lib/bibliothecary/parsers/rubygems.rb +92 -27
data/lib/bibliothecary/parsers/shard.rb +0 -1
data/lib/bibliothecary/parsers/swift_pm.rb +77 -29
data/lib/bibliothecary/parsers/vcpkg.rb +68 -17
data/lib/bibliothecary/runner.rb +169 -22
data/lib/bibliothecary/version.rb +1 -1
data/lib/bibliothecary.rb +3 -10
data/lib/dockerfile_parser.rb +1 -1
data/lib/modelfile_parser.rb +8 -8
metadata +2 -108
data/.codeclimate.yml +0 -25
data/.github/CONTRIBUTING.md +0 -195
data/.github/workflows/ci.yml +0 -25
data/.gitignore +0 -10
data/.rspec +0 -2
data/.rubocop.yml +0 -69
data/.ruby-version +0 -1
data/.tidelift +0 -1
data/CODE_OF_CONDUCT.md +0 -74
data/Gemfile +0 -34
data/Rakefile +0 -18
data/bin/console +0 -15
data/bin/setup +0 -8
data/lib/bibliothecary/multi_parsers/bundler_like_manifest.rb +0 -26
data/lib/bibliothecary/multi_parsers/cyclonedx.rb +0 -170
data/lib/bibliothecary/multi_parsers/dependencies_csv.rb +0 -155
data/lib/bibliothecary/multi_parsers/json_runtime.rb +0 -22
data/lib/bibliothecary/multi_parsers/spdx.rb +0 -149
data/lib/bibliothecary/purl_util.rb +0 -37
data/lib/bibliothecary/runner/multi_manifest_filter.rb +0 -92
data/lib/sdl_parser.rb +0 -30

data/lib/bibliothecary/multi_parsers/dependencies_csv.rb DELETED Viewed

@@ -1,155 +0,0 @@
-# frozen_string_literal: true
-require "csv"
-module Bibliothecary
-  module MultiParsers
-    module DependenciesCSV
-      include Bibliothecary::Analyser
-      include Bibliothecary::Analyser::TryCache
-      def self.mapping
-        {
-          match_filename("dependencies.csv") => {
-            kind: "lockfile",
-            ungroupable: true,
-            parser: :parse_dependencies_csv,
-          },
-        }
-      end
-      # Processing a CSV file isn't as exact as using a real manifest file,
-      # but you can get pretty close as long as the data you're importing
-      # is simple.
-      class CSVFile
-        # Header structures are:
-        #
-        # <field to fill in for dependency> => {
-        #   match: [<regexp of incoming column name to match in priority order, highest priority first>...],
-        #   [default]: <optional default value for this field>
-        # }
-        HEADERS = {
-          "platform" => {
-            match: [
-              /^platform$/i,
-            ],
-          },
-          "name" => {
-            match: [
-              /^name$/i,
-            ],
-          },
-          # Manifests have versions that can have operators.
-          # However, since Bibliothecary only currently supports analyzing a
-          # single file as a single thing (either manifest or lockfile)
-          # we can't return manifest-y data. Only take the lockfile requirement
-          # when processing dependencies.csv for now.
-          "requirement" => {
-            match: [
-              /^(lockfile |)requirement$/i,
-              /^version$/i,
-            ],
-          },
-          "type" => {
-            default: "runtime",
-            match: [
-              /^(lockfile |)type$/i,
-              /^(manifest |)type$/i,
-            ],
-          },
-        }.freeze
-        attr_reader :result
-        def initialize(file_contents)
-          @file_contents = file_contents
-          @result = nil
-          # A Hash of "our field name" => ["header in CSV file", "lower priority header in CSV file"]
-          @header_mappings = {}
-        end
-        def parse!
-          table = parse_and_validate_csv_file
-          @result = table.map.with_index do |row, idx|
-            HEADERS.each_with_object({}) do |(header, info), obj|
-              # find the first non-empty field in the row for this header, or nil if not found
-              row_data = row[@header_mappings[header]]
-              # some column have default data to fall back on
-              if row_data
-                obj[header.to_sym] = row_data
-              elsif info.key?(:default)
-                # if the default is nil, don't even add the key to the hash
-                obj[header.to_sym] = info[:default] if info[:default]
-              else
-                # use 1-based index just like the 'csv' std lib, and count the headers as first row.
-                raise "Missing required field '#{header}' on line #{idx + 2}."
-              end
-            end
-          end
-        end
-        private
-        def parse_and_validate_csv_file
-          table = CSV.parse(@file_contents, headers: true)
-          header_examination_results = map_table_headers_to_local_lookups(table, HEADERS)
-          unless header_examination_results[:missing].empty?
-            raise "Missing required headers #{header_examination_results[:missing].join(', ')} in CSV. Check to make sure header names are all lowercase."
-          end
-          @header_mappings = header_examination_results[:found]
-          table
-        end
-        def map_table_headers_to_local_lookups(table, local_lookups)
-          result = local_lookups.each_with_object({ found: {}, missing: [] }) do |(header, info), obj|
-            results = table.headers.each_with_object([]) do |table_header, matches|
-              info[:match].each_with_index do |match_regexp, index|
-                matches << [table_header, index] if table_header[match_regexp]
-              end
-            end
-            if results.empty?
-              # if a header has a default value it's optional
-              obj[:missing] << header unless info.key?(:default)
-            else
-              # select the highest priority header possible
-              obj[:found][header] ||= nil
-              obj[:found][header] = ([obj[:found][header]] + results).compact.min_by(&:last)
-            end
-          end
-          # strip off the priorities. only one mapping should remain.
-          result[:found].transform_values!(&:first)
-          result
-        end
-      end
-      def parse_dependencies_csv(file_contents, options: {})
-        csv_file = try_cache(options, options[:filename]) do
-          raw_csv_file = CSVFile.new(file_contents)
-          raw_csv_file.parse!
-          raw_csv_file
-        end
-        dependencies = csv_file
-          .result
-          .find_all { |dependency| dependency[:platform] == platform_name.to_s }
-          .map do |dep_kvs|
-            Dependency.new(
-              **dep_kvs, source: options.fetch(:filename, nil)
-            )
-          end
-        ParserResult.new(dependencies: dependencies)
-      end
-    end
-  end
-end

data/lib/bibliothecary/multi_parsers/json_runtime.rb DELETED Viewed

@@ -1,22 +0,0 @@
-# frozen_string_literal: true
-module Bibliothecary
-  module MultiParsers
-    # Provide JSON Runtime Manifest parsing
-    module JSONRuntime
-      def parse_json_runtime_manifest(file_contents, options: {})
-        dependencies = JSON.parse(file_contents).fetch("dependencies", []).map do |name, requirement|
-          Dependency.new(
-            platform: platform_name,
-            name: name,
-            requirement: requirement,
-            type: "runtime",
-            source: options.fetch(:filename, nil)
-          )
-        end
-        ParserResult.new(dependencies: dependencies)
-      end
-    end
-  end
-end

data/lib/bibliothecary/multi_parsers/spdx.rb DELETED Viewed

@@ -1,149 +0,0 @@
-# frozen_string_literal: true
-# packageurl-ruby uses pattern-matching (https://docs.ruby-lang.org/en/2.7.0/NEWS.html#label-Pattern+matching)
-# which warns a whole bunch in Ruby 2.7 as being an experimental feature, but has
-# been accepted in Ruby 3.0 (https://rubyreferences.github.io/rubychanges/3.0.html#pattern-matching).
-Warning[:experimental] = false
-require "package_url"
-Warning[:experimental] = true
-module Bibliothecary
-  module MultiParsers
-    module Spdx
-      include Bibliothecary::Analyser
-      include Bibliothecary::Analyser::TryCache
-      # e.g. 'SomeText:' (allowing for leading whitespace)
-      WELLFORMED_LINE_REGEXP = /^\s*[a-zA-Z]+:/
-      # e.g. 'PackageName: (allowing for excessive whitespace)
-      PACKAGE_NAME_REGEXP = /^\s*PackageName:\s*(.*)/
-      # e.g. 'PackageVersion:' (allowing for excessive whitespace)
-      PACKAGE_VERSION_REGEXP = /^\s*PackageVersion:\s*(.*)/
-      # e.g. "ExternalRef: PACKAGE-MANAGER purl (allowing for excessive whitespace)
-      PURL_REGEXP = /^\s*ExternalRef:\s*PACKAGE[-|_]MANAGER\s*purl\s*(.*)/
-      NoEntries = Class.new(StandardError)
-      MalformedFile = Class.new(StandardError)
-      def self.mapping
-        {
-          match_extension(".spdx") => {
-            kind: "lockfile",
-            parser: :parse_spdx_tag_value,
-            ungroupable: true,
-          },
-          match_extension(".spdx.json") => {
-            kind: "lockfile",
-            parser: :parse_spdx_json,
-            ungroupable: true,
-          },
-        }
-      end
-      def parse_spdx_tag_value(file_contents, options: {})
-        entries = try_cache(options, options[:filename]) do
-          parse_spdx_tag_value_file_contents(file_contents, options.fetch(:filename, nil))
-        end
-        raise NoEntries if entries.empty?
-        Bibliothecary::ParserResult.new(dependencies: entries[platform_name.to_sym] || [])
-      end
-      def parse_spdx_tag_value_file_contents(file_contents, source = nil)
-        entries = {}
-        spdx_name = spdx_version = platform = purl_name = purl_version = nil
-        file_contents.each_line do |line|
-          stripped_line = line.strip
-          next if skip_tag_value_line?(stripped_line)
-          raise MalformedFile unless stripped_line.match?(WELLFORMED_LINE_REGEXP)
-          if (match = stripped_line.match(PACKAGE_NAME_REGEXP))
-            # Per the spec:
-            # > A new package Information section is denoted by the package name (7.1) field.
-            add_entry(entries: entries, platform: platform, purl_name: purl_name,
-                      spdx_name: spdx_name, purl_version: purl_version, spdx_version: spdx_version,
-                      source: source)
-            # reset for this new package
-            spdx_name = spdx_version = platform = purl_name = purl_version = nil
-            # capture the new package's name
-            spdx_name = match[1]
-          elsif (match = stripped_line.match(PACKAGE_VERSION_REGEXP))
-            spdx_version = match[1]
-          elsif (match = stripped_line.match(PURL_REGEXP))
-            purl = PackageURL.parse(match[1])
-            platform ||= PurlUtil::PURL_TYPE_MAPPING[purl.type]
-            purl_name ||= PurlUtil.full_name(purl)
-            purl_version ||= purl.version
-          end
-        end
-        add_entry(entries: entries, platform: platform, purl_name: purl_name,
-                  spdx_name: spdx_name, purl_version: purl_version, spdx_version: spdx_version,
-                  source: source)
-        entries
-      end
-      def skip_tag_value_line?(stripped_line)
-        # Ignore blank lines and comments
-        stripped_line.empty? || stripped_line.start_with?("#")
-      end
-      def parse_spdx_json(file_contents, options: {})
-        entries = try_cache(options, options[:filename]) do
-          parse_spdx_json_file_contents(file_contents, options.fetch(:filename, nil))
-        end
-        raise NoEntries if entries.empty?
-        Bibliothecary::ParserResult.new(dependencies: entries[platform_name.to_sym] || [])
-      end
-      def parse_spdx_json_file_contents(file_contents, source = nil)
-        entries = {}
-        manifest = JSON.parse(file_contents)
-        manifest["packages"]&.each do |package|
-          spdx_name = package["name"]
-          spdx_version = package["versionInfo"]
-          first_purl_string = package["externalRefs"]&.find { |ref| ref["referenceType"] == "purl" }&.dig("referenceLocator")
-          purl = first_purl_string && PackageURL.parse(first_purl_string)
-          platform = PurlUtil::PURL_TYPE_MAPPING[purl&.type]
-          purl_name = PurlUtil.full_name(purl)
-          purl_version = purl&.version
-          add_entry(entries: entries, platform: platform, purl_name: purl_name,
-                    spdx_name: spdx_name, purl_version: purl_version, spdx_version: spdx_version,
-                    source: source)
-        end
-        entries
-      end
-      def add_entry(entries:, platform:, purl_name:, spdx_name:, purl_version:, spdx_version:, source: nil)
-        package_name = purl_name || spdx_name
-        package_version = purl_version || spdx_version
-        return unless platform && package_name && package_version
-        entries[platform.to_sym] ||= []
-        entries[platform.to_sym] << Dependency.new(
-          platform: platform.to_s,
-          name: package_name,
-          requirement: package_version,
-          type: "lockfile",
-          source: source
-        )
-      end
-    end
-  end
-end

data/lib/bibliothecary/purl_util.rb DELETED Viewed

@@ -1,37 +0,0 @@
-# frozen_string_literal: true
-module Bibliothecary
-  class PurlUtil
-    # If a purl type (key) exists, it will be used in a manifest for
-    # the key's value. If not, it's ignored.
-    #
-    # https://github.com/package-url/purl-spec/blob/master/PURL-TYPES.rst
-    PURL_TYPE_MAPPING = {
-      "golang" => :go,
-      "maven" => :maven,
-      "npm" => :npm,
-      "cargo" => :cargo,
-      "composer" => :packagist,
-      "conda" => :conda,
-      "cran" => :cran,
-      "gem" => :rubygems,
-      "nuget" => :nuget,
-      "pypi" => :pypi,
-    }.freeze
-    # @param purl [PackageURL]
-    # @return [String] The properly namespaced package name
-    def self.full_name(purl)
-      return nil if purl.nil?
-      parts = [purl.namespace, purl.name].compact
-      case purl.type
-      when "maven"
-        parts.join(":")
-      else
-        parts.join("/")
-      end
-    end
-  end
-end

data/lib/bibliothecary/runner/multi_manifest_filter.rb DELETED Viewed

@@ -1,92 +0,0 @@
-# frozen_string_literal: true
-module Bibliothecary
-  class Runner
-    class MultiManifestFilter
-      # Wrap up a file analysis for easier validity testing
-      class FileAnalysis
-        def initialize(file_analysis)
-          @file_analysis = file_analysis
-        end
-        # Determine if we should skip this file analysis when processing
-        # @return [Boolean] True if we should skip processing
-        def skip?
-          !@file_analysis ||
-            !@file_analysis[:dependencies] ||
-            @file_analysis[:dependencies].empty?
-        end
-      end
-      def initialize(path:, related_files_info_entries:, runner:)
-        @path = path
-        @related_files_info_entries = related_files_info_entries
-        @runner = runner
-      end
-      # Standalone multi manifest files should *always* be treated as lockfiles,
-      # since there's no human-written manifest file to go with them.
-      def files_to_check
-        @files_to_check ||= @related_files_info_entries.each_with_object({}) do |files_info, all|
-          files_info.lockfiles.each do |file|
-            all[file] ||= 0
-            all[file] += 1
-          end
-        end
-      end
-      def results
-        partition_file_entries!
-        (no_lockfile_results + single_file_results + multiple_file_results).uniq
-      end
-      def no_lockfile_results
-        @no_lockfile_results ||= @related_files_info_entries.find_all { |rfi| rfi.lockfiles.empty? }
-      end
-      def single_file_results
-        @single_file_results ||= @single_file_entries.map do |file|
-          @related_files_info_entries.find { |rfi| rfi.lockfiles.include?(file) }
-        end
-      end
-      def multiple_file_results
-        return @multiple_file_results if @multiple_file_results
-        @multiple_file_results = []
-        each_analysis_and_rfis do |analysis, rfis_for_file|
-          rfis_for_file.each do |rfi|
-            file_analysis = FileAnalysis.new(
-              analysis.find { |a| a[:platform] == rfi.platform }
-            )
-            next if file_analysis.skip?
-            @multiple_file_results << rfi
-          end
-        end
-        @multiple_file_results
-      end
-      def each_analysis_and_rfis
-        @multiple_file_entries.each do |file|
-          contents = Bibliothecary.utf8_string(File.read(File.join(@path, file)))
-          analysis = @runner.analyse_file(file, contents)
-          rfis_for_file = @related_files_info_entries.find_all { |rfi| rfi.lockfiles.include?(file) }
-          yield analysis, rfis_for_file
-        end
-      end
-      def partition_file_entries!
-        @single_file_entries, @multiple_file_entries = files_to_check.partition { |_file, count| count == 1 }
-        @single_file_entries = @single_file_entries.map(&:first)
-        @multiple_file_entries = @multiple_file_entries.map(&:first)
-      end
-    end
-  end
-end

data/lib/sdl_parser.rb DELETED Viewed

@@ -1,30 +0,0 @@
-# frozen_string_literal: true
-require "sdl4r"
-class SdlParser
-  attr_reader :contents, :type
-  def initialize(type, contents, platform, source = nil)
-    @contents = contents
-    @type = type || "runtime"
-    @platform = platform
-    @source = source
-  end
-  def dependencies
-    parse.children("dependency").inject([]) do |deps, dep|
-      deps.push(Bibliothecary::Dependency.new(
-                  platform: @platform,
-                  name: dep.value,
-                  requirement: dep.attribute("version") || ">= 0",
-                  type: type,
-                  source: @source
-                ))
-    end.uniq
-  end
-  def parse
-    SDL4R.read(contents)
-  end
-end