RubyGems - ecosystems-bibliothecary - Versions diffs - 14.2.0 → 15.0.0 - Mend

ecosystems-bibliothecary 14.2.0 → 15.0.0

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (72)

checksums.yaml +4 -4
data/CHANGELOG.md +48 -0
data/README.md +9 -24
data/bibliothecary.gemspec +5 -9
data/lib/bibliothecary/analyser/analysis.rb +10 -5
data/lib/bibliothecary/analyser/matchers.rb +7 -5
data/lib/bibliothecary/analyser.rb +0 -30
data/lib/bibliothecary/cli.rb +35 -26
data/lib/bibliothecary/configuration.rb +1 -6
data/lib/bibliothecary/dependency.rb +1 -4
data/lib/bibliothecary/file_info.rb +7 -0
data/lib/bibliothecary/parsers/bentoml.rb +0 -2
data/lib/bibliothecary/parsers/bower.rb +0 -1
data/lib/bibliothecary/parsers/cargo.rb +12 -10
data/lib/bibliothecary/parsers/carthage.rb +51 -15
data/lib/bibliothecary/parsers/clojars.rb +14 -18
data/lib/bibliothecary/parsers/cocoapods.rb +100 -19
data/lib/bibliothecary/parsers/cog.rb +0 -2
data/lib/bibliothecary/parsers/conan.rb +156 -0
data/lib/bibliothecary/parsers/conda.rb +0 -3
data/lib/bibliothecary/parsers/cpan.rb +0 -2
data/lib/bibliothecary/parsers/cran.rb +40 -19
data/lib/bibliothecary/parsers/docker.rb +0 -2
data/lib/bibliothecary/parsers/dub.rb +33 -8
data/lib/bibliothecary/parsers/dvc.rb +0 -2
data/lib/bibliothecary/parsers/elm.rb +13 -3
data/lib/bibliothecary/parsers/go.rb +14 -5
data/lib/bibliothecary/parsers/hackage.rb +132 -24
data/lib/bibliothecary/parsers/haxelib.rb +14 -4
data/lib/bibliothecary/parsers/hex.rb +37 -20
data/lib/bibliothecary/parsers/homebrew.rb +0 -2
data/lib/bibliothecary/parsers/julia.rb +0 -2
data/lib/bibliothecary/parsers/maven.rb +35 -25
data/lib/bibliothecary/parsers/meteor.rb +14 -4
data/lib/bibliothecary/parsers/mlflow.rb +0 -2
data/lib/bibliothecary/parsers/npm.rb +47 -59
data/lib/bibliothecary/parsers/nuget.rb +23 -22
data/lib/bibliothecary/parsers/ollama.rb +0 -2
data/lib/bibliothecary/parsers/packagist.rb +0 -3
data/lib/bibliothecary/parsers/pub.rb +0 -2
data/lib/bibliothecary/parsers/pypi.rb +54 -35
data/lib/bibliothecary/parsers/rubygems.rb +92 -27
data/lib/bibliothecary/parsers/shard.rb +0 -1
data/lib/bibliothecary/parsers/swift_pm.rb +77 -29
data/lib/bibliothecary/parsers/vcpkg.rb +68 -17
data/lib/bibliothecary/runner.rb +169 -22
data/lib/bibliothecary/version.rb +1 -1
data/lib/bibliothecary.rb +3 -10
data/lib/dockerfile_parser.rb +1 -1
data/lib/modelfile_parser.rb +8 -8
metadata +2 -108
data/.codeclimate.yml +0 -25
data/.github/CONTRIBUTING.md +0 -195
data/.github/workflows/ci.yml +0 -25
data/.gitignore +0 -10
data/.rspec +0 -2
data/.rubocop.yml +0 -69
data/.ruby-version +0 -1
data/.tidelift +0 -1
data/CODE_OF_CONDUCT.md +0 -74
data/Gemfile +0 -34
data/Rakefile +0 -18
data/bin/console +0 -15
data/bin/setup +0 -8
data/lib/bibliothecary/multi_parsers/bundler_like_manifest.rb +0 -26
data/lib/bibliothecary/multi_parsers/cyclonedx.rb +0 -170
data/lib/bibliothecary/multi_parsers/dependencies_csv.rb +0 -155
data/lib/bibliothecary/multi_parsers/json_runtime.rb +0 -22
data/lib/bibliothecary/multi_parsers/spdx.rb +0 -149
data/lib/bibliothecary/purl_util.rb +0 -37
data/lib/bibliothecary/runner/multi_manifest_filter.rb +0 -92
data/lib/sdl_parser.rb +0 -30

checksums.yaml CHANGED Viewed

@@ -1,7 +1,7 @@
 ---
 SHA256:
-  metadata.gz: c531c54aa377c8bc30d1a2f75e3de0bbad1a0502568976f3d487fe3c4c78bc53
-  data.tar.gz: 82b7ca70158bc5ce1094af762eed9b7cb20fa6492c807663c965266bc8ce535a
+  metadata.gz: b18779ed0610462aee8f4fc8c9df7989b42ae2ba1e87f1d7592d408b35fbb606
+  data.tar.gz: 004c0db1d58aefbb9cf5a599bb9f7b5790f3c5fd31f1f96b6e3159ba4d646711
 SHA512:
-  metadata.gz: a981fd824d3227d00b9a937199ab3eeb007139c7f76c28de5a8681e1a680948cfe453abab0a791ea4b65c56d6f2d22943b7a834b6c83c3df36de746504bb2c1d
-  data.tar.gz: 35ec260ba3a5a92a84a5db142771681eb609feb1a65288471f1152f29838d118484f7e1ad9f0e6ff021547b322a8dc0a384a53bf5939e55ee6b4430f4224bc24
+  metadata.gz: 466de11f118fe2097167ed318baf5d41289eadf61b68d34329ded86c43bf9efab5ff75bb6e1af7d96f8acc41d7ef2c2815c7838517704c9f6d62d443e491c49d
+  data.tar.gz: 5c9c5baef7c35f6de525449cc3b71331d607095a9491b56fbcc69b0d3e6683186ad7d066cf6d28b537960750cebdc533fb7065da51847b03069bd51175a57169

data/CHANGELOG.md CHANGED Viewed

@@ -13,6 +13,54 @@ and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0
 ### Removed
+## [15.0.0]
+### Added
+- Conan parser: conanfile.py, conanfile.txt, conan.lock
+- vcpkg lockfile support: _generated-vcpkg-list.json
+- vcpkg improvements: overrides support, dev dependency detection (host: true)
+### Changed
+- NuGet packages.lock.json now returns dependencies from all target frameworks instead of arbitrarily picking one
+- Optimized Maven text parsers: lazy ANSI stripping, skip newline normalization when not needed (10-20% faster)
+- Optimized yarn.lock v1 parser with lazy newline normalization (16% faster)
+- Optimized requirements.txt parser with each_line iteration and cached source lookup (10% faster)
+### Removed
+- SPDX parser and support for *.spdx, *.spdx.json files
+- CycloneDX parser and support for cyclonedx.xml, cyclonedx.json, *.cdx.xml, *.cdx.json files
+- DependenciesCSV multi_parser and support for dependencies.csv files
+- packageurl-ruby dependency
+- Multi-parser infrastructure (add_multi_parser, MultiManifestFilter)
+## [14.4.0]
+### Changed
+- Switched Cargo.lock, poetry.lock, uv.lock, Gopkg.lock, and pylock.toml parsers from full TOML parsing to regex-based parsing for 50-250x faster lockfile parsing on these formats.
+- Switched Gemfile.lock parser from Bundler::LockfileParser to regex-based parsing for 6x faster parsing.
+- Switched Podfile.lock parser from YAML to regex-based parsing for 5x faster parsing.
+- Switched yarn.lock v2+ parser from YAML to regex-based parsing for 14x faster parsing.
+## [14.3.0]
+### Added
+- Added `bin/benchmark` script for performance testing.
+### Changed
+- Fixed bug where Runner was recreated on every Bibliothecary method call, causing repeated index rebuilding.
+- Memoized package_managers array in Runner.
+- Added filename/extension index for O(1) parser lookup instead of O(n) linear scan through all parsers.
+- Optimized `identify_manifests` to use filename index directly (~139x faster).
+- Optimized `analyse_file` to use filename index for candidate filtering (~16x faster).
+- Added per-file caching of mapping details in FileInfo to avoid repeated lookups.
+- Added `parse_file_info` method to reuse FileInfo objects during parsing.
 ## [14.2.0]
 ### Added

data/README.md CHANGED Viewed

@@ -4,8 +4,6 @@ Dependency manifest parsing library for https://github.com/ecosyste-ms
 This is a maintained fork of the original [Bibliothecary](https://github.com/librariesio/bibliothecary) gem, with support for additional manifest formats and bug fixes.
-[![license](https://img.shields.io/github/license/ecosyste-ms/bibliothecary.svg)](https://github.com/ecosyste-ms/bibliothecary/blob/master/LICENSE.txt)
 ## Installation
 Requires Ruby 3.4 or above.
@@ -13,12 +11,14 @@ Requires Ruby 3.4 or above.
 Add this line to your application's Gemfile:
 ```ruby
-gem "bibliothecary", git: "https://github.com/ecosyste-ms/bibliothecary.git"
+gem "ecosystems-bibliothecary", git: "https://github.com/ecosyste-ms/bibliothecary.git", require: "bibliothecary"
 ```
 And then execute:
-    $ bundle install
+```shell
+bundle install
+```
 ## Usage
@@ -40,14 +40,6 @@ Search a directory for manifest files and parse the contents:
 Bibliothecary.analyse('./')
 ```
-There are a number of parsers that rely on web services to parse the file formats, those urls can be configured like so:
-```ruby
-Bibliothecary.configure do |config|
-  config.carthage_parser_host = 'http://my-carthage-parsing-service.com'
-end
-```
 All available config options are in: https://github.com/ecosyste-ms/bibliothecary/blob/master/lib/bibliothecary/configuration.rb
 ## Supported package manager file formats
@@ -103,18 +95,6 @@ All available config options are in: https://github.com/ecosyste-ms/bibliothecar
   - paket.lock
   - *.csproj
   - project.assets.json
-- CycloneDX
-  - cyclonedx.xml
-  - cyclonedx.json
-  - *.cdx.xml
-  - *.cdx.json
-  - Note that CycloneDX manifests can contain information on multiple
-    package manager's packages!
-- SPDX
-  - tag:value as *.spdx
-  - JSON as *.spdx.json
-  - Note that SPDX manifests can contain information on multiple
-    package manager's packages!
 - Bower
   - bower.json
 - BentoML
@@ -134,6 +114,10 @@ All available config options are in: https://github.com/ecosyste-ms/bibliothecar
   - project.clj
 - Cog
   - cog.yaml
+- Conan
+  - conanfile.py
+  - conanfile.txt
+  - conan.lock
 - Meteor
   - versions.json
 - MLflow
@@ -198,6 +182,7 @@ All available config options are in: https://github.com/ecosyste-ms/bibliothecar
   - dvc.yaml
 - Vcpkg
   - vcpkg.json
+  - _generated-vcpkg-list.json
 - Homebrew
   - Brewfile
   - Brewfile.lock.json

data/bibliothecary.gemspec CHANGED Viewed

@@ -16,23 +16,19 @@ Gem::Specification.new do |spec|
   spec.homepage      = "https://github.com/ecosyste-ms/bibliothecary"
   spec.license       = "AGPL-3.0"
-  spec.files         = `git ls-files -z`.split("\x0").reject { |f| f.match(%r{^(test|spec|features)/}) }
+  spec.files         = `git ls-files -z`.split("\x0").reject do |f|
+    f.match(%r{^(test|spec|features|\.github)/|^bin/(benchmark|console|setup)|^\.|^(Gemfile|Rakefile|CODE_OF_CONDUCT)})
+  end
   spec.bindir        = "bin"
-  spec.executables   = spec.files.grep(%r{^bin/}) { |f| File.basename(f) }
+  spec.executables   = %w[bibliothecary]
   spec.require_paths = ["lib"]
   spec.add_dependency "bundler"
-  spec.add_dependency "commander"
   spec.add_dependency "csv"
-  spec.add_dependency "deb_control"
   spec.add_dependency "json", "~> 2.8"
-  spec.add_dependency "librariesio-gem-parser"
   spec.add_dependency "ox", ">= 2.8.1"
-  spec.add_dependency "packageurl-ruby"
-  spec.add_dependency "racc"
-  spec.add_dependency "sdl4r"
+  spec.add_dependency "racc" # required by tomlrb but not declared as a dependency
   spec.add_dependency "tomlrb", "~> 2.0"
-  spec.add_dependency "typhoeus"
   spec.metadata["rubygems_mfa_required"] = "true"
 end

data/lib/bibliothecary/analyser/analysis.rb CHANGED Viewed

@@ -40,7 +40,7 @@ module Bibliothecary
         # If your Parser needs to return multiple responses for one file, please override this method
         # For example see conda.rb
         kind = determine_kind_from_info(info)
-        parser_result = parse_file(info.relative_path, info.contents, options: options)
+        parser_result = parse_file_info(info, options: options)
         parser_result = ParserResult.new(dependencies: []) if parser_result.nil? # work around any legacy parsers that return nil
         Bibliothecary::Analyser.create_analysis(platform_name, info.relative_path, kind, parser_result)
@@ -52,26 +52,31 @@ module Bibliothecary
       # Call the matching parse class method for this file with
       # these contents
       def parse_file(filename, contents, options: {})
-        details = first_matching_mapping_details(FileInfo.new(nil, filename, contents))
+        parse_file_info(FileInfo.new(nil, filename, contents), options: options)
+      end
+      # Parse a file using its FileInfo object, reusing cached mapping details.
+      def parse_file_info(info, options: {})
+        details = first_matching_mapping_details(info)
         # this can be raised if we don't check match?/match_info?,
         # OR don't have the file contents when we check them, so
         # it turns out for example that a .xml file isn't a
         # manifest after all.
-        raise Bibliothecary::FileParsingError.new("No parser for this file type", filename) unless details[:parser]
+        raise Bibliothecary::FileParsingError.new("No parser for this file type", info.relative_path) unless details[:parser]
         # The `parser` method should raise an exception if the file is malformed,
         # should return empty [] if the file is fine but simply doesn't contain
         # any dependencies, and should never return nil. At the time of writing
         # this comment, some of the parsers return [] or nil to mean an error
         # which is confusing to users.
-        send(details[:parser], contents, options: options.merge(filename: filename))
+        send(details[:parser], info.contents, options: options.merge(filename: info.relative_path))
       rescue Exception => e # default is StandardError but C bindings throw Exceptions # rubocop:disable Lint/RescueException
         # the C xml parser also puts a newline at the end of the message
         location = e.backtrace_locations[0]
           .to_s
           .then { |l| l =~ /bibliothecary\// ? l.split("bibliothecary/").last : l.split("gems/").last }
-        raise Bibliothecary::FileParsingError.new(e.message.strip, filename, location)
+        raise Bibliothecary::FileParsingError.new(e.message.strip, info.relative_path, location)
       end
       private

data/lib/bibliothecary/analyser/matchers.rb CHANGED Viewed

@@ -52,12 +52,14 @@ module Bibliothecary
         first_matching_mapping_details(info).any?
       end
-      private
+      # Get mapping details for this file, using cache if available.
+      # The cache is stored on the FileInfo object to avoid repeated lookups.
       def first_matching_mapping_details(info)
-        mapping
-          .find { |matcher, details| mapping_entry_match?(matcher, details, info) }
-          &.last || {}
+        info.cached_mapping_details(self) do
+          mapping
+            .find { |matcher, details| mapping_entry_match?(matcher, details, info) }
+            &.last || {}
+        end
       end
     end
   end

data/lib/bibliothecary/analyser.rb CHANGED Viewed

@@ -38,18 +38,6 @@ module Bibliothecary
       base.extend(Bibliothecary::Analyser::Analysis)
     end
-    module TryCache
-      def try_cache(options, key)
-        if options[:cache]
-          options[:cache][key] ||= yield
-          options[:cache][key]
-        else
-          yield
-        end
-      end
-    end
     module ClassMethods
       def platform_name
         @platform_name ||= name.to_s.split("::").last.downcase.freeze
@@ -66,24 +54,6 @@ module Bibliothecary
           )
         end
       end
-      # Add a MultiParser module to a Parser class. This extends the
-      # self.mapping method on the parser to include the multi parser's
-      # files to watch for, and it extends the Parser class with
-      # the multi parser for you.
-      #
-      # @param klass [Class] A Bibliothecary::MultiParsers class
-      def add_multi_parser(klass)
-        raise "No mapping found! You should place the add_multi_parser call below def self.mapping." unless respond_to?(:mapping)
-        original_mapping = mapping
-        define_singleton_method(:mapping) do
-          original_mapping.merge(klass.mapping)
-        end
-        send(:extend, klass)
-      end
     end
   end
 end

data/lib/bibliothecary/cli.rb CHANGED Viewed

@@ -2,39 +2,48 @@
 require "bibliothecary/version"
 require "bibliothecary"
-require "commander"
+require "optparse"
 module Bibliothecary
   class CLI
-    include Commander::Methods
     def run
-      program :name, "Bibliothecary"
-      program :version, Bibliothecary::VERSION
-      program :description, "Parse dependency information from a file or folder of code"
-      command(:list) do |c|
-        c.syntax = "bibliothecary list"
-        c.description = "List dependencies"
-        c.option("--path FILENAME", String, "Path to file/folder to analyse")
-        c.action do |_args, options|
-          options.default path: "./"
-          output = Bibliothecary.analyse(options.path)
-          output.each do |file_contents|
-            puts "#{file_contents[:path]} (#{file_contents[:platform]})"
-            file_contents[:dependencies].group_by { |d| d[:type] }.each do |type, deps|
-              puts "  #{type}"
-              deps.each do |dep|
-                puts "    #{dep[:name]} #{dep[:requirement]}"
-              end
-              puts
-            end
-            puts
-          end
+      options = { path: "./" }
+      parser = OptionParser.new do |opts|
+        opts.banner = "Usage: bibliothecary [options]"
+        opts.separator ""
+        opts.separator "Parse dependency information from a file or folder of code"
+        opts.separator ""
+        opts.on("-p", "--path PATH", "Path to file/folder to analyse (default: ./)") do |path|
+          options[:path] = path
+        end
+        opts.on("-v", "--version", "Show version") do
+          puts Bibliothecary::VERSION
+          exit
+        end
+        opts.on("-h", "--help", "Show this help") do
+          puts opts
+          exit
         end
       end
-      run!
+      parser.parse!
+      output = Bibliothecary.analyse(options[:path])
+      output.each do |file_contents|
+        puts "#{file_contents[:path]} (#{file_contents[:platform]})"
+        file_contents[:dependencies].group_by { |d| d[:type] }.each do |type, deps|
+          puts "  #{type}"
+          deps.each do |dep|
+            puts "    #{dep[:name]} #{dep[:requirement]}"
+          end
+          puts
+        end
+        puts
+      end
     end
   end
 end

data/lib/bibliothecary/configuration.rb CHANGED Viewed

@@ -2,16 +2,11 @@
 module Bibliothecary
   class Configuration
-    attr_accessor :ignored_dirs, :ignored_files, :carthage_parser_host, :clojars_parser_host, :mix_parser_host, :conda_parser_host, :swift_parser_host, :cabal_parser_host
+    attr_accessor :ignored_dirs, :ignored_files
     def initialize
       @ignored_dirs = [".git", "node_modules", "bower_components", "vendor", "dist"]
       @ignored_files = []
-      @carthage_parser_host = "https://carthage.libraries.io"
-      @clojars_parser_host  = "https://clojars.libraries.io"
-      @mix_parser_host      = "https://mix.libraries.io"
-      @swift_parser_host    = "http://swift.libraries.io"
-      @cabal_parser_host    = "http://cabal.libraries.io"
     end
   end
 end

data/lib/bibliothecary/dependency.rb CHANGED Viewed

@@ -5,10 +5,7 @@ module Bibliothecary
   #
   # @attr_reader [String] name The name of the package, e.g. "ansi-string-colors"
   # @attr_reader [String] requirement The version requirement of the release, e.g. "1.0.0" or "^1.0.0"
-  # @attr_reader [String] platform The platform of the package, e.g. "maven". This is optional because
-  #   it's implicit in most parser results, and the analyzer returns the platform name itself. One
-  #   exception are multi-parsers like DependenciesCSV, because they may return deps from multiple platforms.
-  #   Bibliothecary could start returning this field for *all* deps in future, and make it required. (default: nil)
+  # @attr_reader [String] platform The platform of the package, e.g. "maven".
   # @attr_reader [String] type The type or scope of dependency, e.g. "runtime" or "test". In some ecosystems a
   #   default may be set and in other ecosystems it may make sense to return nil when not found.
   # @attr_reader [Boolean] direct Is this dependency a direct dependency (vs transitive dependency)? (default: nil)

data/lib/bibliothecary/file_info.rb CHANGED Viewed

@@ -46,10 +46,17 @@ module Bibliothecary
       @contents = contents
       @package_manager = nil
+      @mapping_cache = {}
     end
     def groupable?
       @package_manager&.groupable?(self)
     end
+    # Cache and retrieve mapping details for a given package manager class.
+    # This avoids repeatedly calling first_matching_mapping_details.
+    def cached_mapping_details(package_manager_class)
+      @mapping_cache[package_manager_class] ||= yield
+    end
   end
 end

data/lib/bibliothecary/parsers/bentoml.rb CHANGED Viewed

@@ -15,8 +15,6 @@ module Bibliothecary
         }
       end
-      add_multi_parser(Bibliothecary::MultiParsers::CycloneDX)
-      add_multi_parser(Bibliothecary::MultiParsers::DependenciesCSV)
       def self.parse_bentofile(file_contents, options: {})
         source = options.fetch(:filename, 'bentofile.yaml')

data/lib/bibliothecary/parsers/bower.rb CHANGED Viewed

@@ -16,7 +16,6 @@ module Bibliothecary
         }
       end
-      add_multi_parser(Bibliothecary::MultiParsers::DependenciesCSV)
       def self.parse_manifest(file_contents, options: {})
         json = JSON.parse(file_contents)

data/lib/bibliothecary/parsers/cargo.rb CHANGED Viewed

@@ -18,9 +18,6 @@ module Bibliothecary
         }
       end
-      add_multi_parser(Bibliothecary::MultiParsers::CycloneDX)
-      add_multi_parser(Bibliothecary::MultiParsers::Spdx)
-      add_multi_parser(Bibliothecary::MultiParsers::DependenciesCSV)
       def self.parse_manifest(file_contents, options: {})
         manifest = Tomlrb.parse(file_contents)
@@ -48,19 +45,24 @@ module Bibliothecary
       end
       def self.parse_lockfile(file_contents, options: {})
-        manifest = Tomlrb.parse(file_contents)
-        dependencies = manifest.fetch("package", []).map do |dependency|
-          next if !dependency["source"] || !dependency["source"].start_with?("registry+")
+        dependencies = []
+        # Split into [[package]] blocks and extract fields from each
+        file_contents.split(/\[\[package\]\]/).drop(1).each do |block|
+          name = block[/name\s*=\s*"([^"]+)"/, 1]
+          version = block[/version\s*=\s*"([^"]+)"/, 1]
+          source = block[/source\s*=\s*"([^"]+)"/, 1]
+          # Skip packages without a registry source (local/workspace packages)
+          next unless source&.start_with?("registry+")
-          Dependency.new(
-            name: dependency["name"],
-            requirement: dependency["version"],
+          dependencies << Dependency.new(
+            name: name,
+            requirement: version,
             type: "runtime",
             source: options.fetch(:filename, nil),
             platform: platform_name
           )
         end
-          .compact
         ParserResult.new(dependencies: dependencies)
       end
     end

data/lib/bibliothecary/parsers/carthage.rb CHANGED Viewed

@@ -3,6 +3,18 @@ module Bibliothecary
     class Carthage
       include Bibliothecary::Analyser
+      # Matches Cartfile entries:
+      # github "owner/repo" >= 1.0
+      # github "owner/repo" "branch"
+      # github "owner/repo"
+      # git "url" "ref"
+      # binary "url" >= 1.0
+      # Group 1: source type (github, git, binary)
+      # Group 2: identifier (owner/repo or URL)
+      # Group 3: quoted version/branch
+      # Group 4: unquoted requirement (e.g., >= 1.0, ~> 2.0)
+      CARTFILE_REGEXP = /^(github|git|binary)\s+"([^"]+)"(?:\s+(?:"([^"]+)"|((?:>=|<=|~>|==|>|<)\s*[\d.]+)))?/
       def self.mapping
         {
           match_filename("Cartfile") => {
@@ -20,36 +32,60 @@ module Bibliothecary
         }
       end
-      add_multi_parser(Bibliothecary::MultiParsers::CycloneDX)
-      add_multi_parser(Bibliothecary::MultiParsers::DependenciesCSV)
       def self.parse_cartfile(file_contents, options: {})
-        map_dependencies(file_contents, "cartfile", options.fetch(:filename, "Cartfile"))
+        parse_cartfile_contents(file_contents, options.fetch(:filename, "Cartfile"), "runtime")
       end
       def self.parse_cartfile_private(file_contents, options: {})
-        map_dependencies(file_contents, "cartfile.private", options.fetch(:filename, "Cartfile.private"))
+        parse_cartfile_contents(file_contents, options.fetch(:filename, "Cartfile.private"), "development")
       end
       def self.parse_cartfile_resolved(file_contents, options: {})
-        map_dependencies(file_contents, "cartfile.resolved", options.fetch(:filename, "Cartfile.resolved"))
+        parse_cartfile_contents(file_contents, options.fetch(:filename, "Cartfile.resolved"), "runtime")
       end
-      def self.map_dependencies(manifest, path, source)
-        response = Typhoeus.post("#{Bibliothecary.configuration.carthage_parser_host}/#{path}", params: {body: manifest}, timeout: 60)
-        raise Bibliothecary::RemoteParsingError.new("Http Error #{response.response_code} when contacting: #{Bibliothecary.configuration.carthage_parser_host}/#{path}", response.response_code) unless response.success?
-        json = JSON.parse(response.body)
+      def self.parse_cartfile_contents(contents, source, type)
+        deps = []
+        contents.each_line do |line|
+          # Remove inline comments
+          line = line.sub(/#.*$/, "").strip
+          next if line.empty?
+          match = line.match(CARTFILE_REGEXP)
+          next unless match
-        deps = json.map do |dependency|
-          Bibliothecary::Dependency.new(
+          source_type = match[1]  # github, git, or binary
+          identifier = match[2]   # owner/repo or URL
+          # match[3] is quoted version/branch, match[4] is unquoted requirement
+          version = match[3] || match[4] || "*"
+          # For github sources, use identifier as-is (could be owner/repo or full URL)
+          # For git/binary sources, extract repo name from URL
+          name = case source_type
+                 when "github"
+                   # Could be "owner/repo" or a full URL like "https://enterprise.local/..."
+                   if identifier.include?("://")
+                     identifier.split("/").last&.sub(/\.git$/, "") || identifier
+                   else
+                     identifier
+                   end
+                 else
+                   # Extract name from URL (last path component without .git)
+                   identifier.split("/").last&.sub(/\.git$/, "") || identifier
+                 end
+          deps << Dependency.new(
             platform: platform_name,
-            name: dependency["name"],
-            requirement: dependency["version"],
-            type: dependency["type"],
+            name: name,
+            requirement: version,
+            type: type,
             source: source
           )
         end
-        Bibliothecary::ParserResult.new(dependencies: deps)
+        ParserResult.new(dependencies: deps)
       end
     end
   end

data/lib/bibliothecary/parsers/clojars.rb CHANGED Viewed

@@ -1,11 +1,12 @@
-require "json"
-require "typhoeus"
 module Bibliothecary
   module Parsers
     class Clojars
       include Bibliothecary::Analyser
+      # Matches individual dependency: [name "version"]
+      # Name can be like: org.clojure/clojure, cheshire, ring/ring-defaults
+      DEPENDENCY_REGEXP = %r{\[([a-zA-Z0-9_./\-]+)\s+"([^"]+)"\]}
       def self.mapping
         {
           match_filename("project.clj") => {
@@ -15,31 +16,26 @@ module Bibliothecary
         }
       end
-      add_multi_parser(Bibliothecary::MultiParsers::CycloneDX)
-      add_multi_parser(Bibliothecary::MultiParsers::DependenciesCSV)
       def self.parse_manifest(file_contents, options: {})
         source = options.fetch(:filename, "project.clj")
-        response = Typhoeus.post("#{Bibliothecary.configuration.clojars_parser_host}/project.clj", body: file_contents, timeout: 60)
-        raise Bibliothecary::RemoteParsingError.new("Http Error #{response.response_code} when contacting: #{Bibliothecary.configuration.clojars_parser_host}/project.clj", response.response_code) unless response.success?
-        json = JSON.parse response.body
-        index = json.index("dependencies")
+        deps = []
-        deps = if index
-          dependencies = json[index + 1]
-          dependencies.map do |dependency|
-            Bibliothecary::Dependency.new(
+        # Find the :dependencies section and extract deps
+        # Look for :dependencies followed by a vector of vectors
+        if (deps_section = file_contents[/:dependencies\s*\[.*?\]\]/m])
+          deps_section.scan(DEPENDENCY_REGEXP) do |name, version|
+            deps << Dependency.new(
               platform: platform_name,
-              name: dependency[0],
-              requirement: dependency[1],
+              name: name,
+              requirement: version,
               type: "runtime",
               source: source
             )
           end
-        else
-          []
         end
-        Bibliothecary::ParserResult.new(dependencies: deps)
+        ParserResult.new(dependencies: deps)
       end
     end
   end