RubyGems - raimei-bench - Versions diffs - 0.1.0 → 0.1.2 - Mend

raimei-bench 0.1.0 → 0.1.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (8)

checksums.yaml CHANGED

@@ -1,7 +1,7 @@
 ---
 SHA256:
-  metadata.gz: 416d74032625f8a01432c62377b606eb5c26da186b6a5a45708304d6ecb41b35
-  data.tar.gz: dd1952e30833c70c69640963c2cb4cf4138b5f302cb2e54c48e80bf3ffd597c3
+  metadata.gz: 15fa8bff21ad42eef9d31f70b09725e018fa800f78b1bf9e9328fceec1cce417
+  data.tar.gz: f3e50c0d28eb25cb04cb0dc5744276923fece6ca56255396bb5c2fe00baca8ee
 SHA512:
-  metadata.gz: e7946148aeaab7fb252f68d5d6cd800528e8314fec81556afa94bd91c3c022755ffabd98861a631aed7f8f687b79fbab7e4eaf4a2275b18fc2d298d4b26c0fff
-  data.tar.gz: c82d1f8b11a53e681ac704f8f6455c2815521b0b612f03595cd4afe98318da5bacc4907af3a043e8d5cc816ffec98d03fbe0e905b1488e25d1419672228bde12
+  metadata.gz: bdf9771fb6a5fbdfe2741fef1026e1a509b543fbb0f7a1b45e2530e0e8f9a0bec355137789f034c77c265ac515fee3dd39cb26feec16c63b54026f047bc20857
+  data.tar.gz: 9fd10c15d9060703f16390cfb364e991c13520011cb6fcb9d7e2ee05052410c9f4d95a8d3746848c26efaf86e07dfa1a80e7a7d8542b99c0bd7bdc5514479919

data/Gemfile ADDED

@@ -0,0 +1,13 @@
+# frozen_string_literal: true
+source "https://rubygems.org"
+# Specify your gem's dependencies in raimei-bench.gemspec
+gemspec
+gem "irb"
+gem "rake", "~> 13.0"
+gem "minitest", "~> 5.16"
+gem "rubocop", "~> 1.21"

data/README.md CHANGED

@@ -1,5 +1,8 @@
 # Raimei::Bench
+> ⚠️ Experimental: APIs may change.
 TODO: Delete this and the text below, and describe your gem
 Welcome to your new gem! In this directory, you'll find the files you need to be able to package up your Ruby library into a gem. Put your Ruby code in the file `lib/raimei/bench`. To experiment with that code, run `bin/console` for an interactive prompt.

data/exe/raimei-bench ADDED

@@ -0,0 +1,62 @@
+#!/usr/bin/env ruby
+# frozen_string_literal: true
+# Add local libs so this works without Bundler
+root = File.expand_path("../../..", __dir__) # three directories above the directory holding this script
+%w[raimei-bench raimei-nim raimei-shared].each do |g|
+  $LOAD_PATH.unshift File.join(root, "gems", g, "lib") # presumably a monorepo layout <root>/gems/<gem>/lib — TODO confirm
+end
+require "optparse"
+require "yaml"
+require "raimei/bench"
+require "raimei/bench/report"
+def env_or_literal(field) # Resolve a scenario value: "ENV(NAME)" -> ENV["NAME"]; any other String is returned unchanged
+  case field
+  when String
+    if (m = field.match(/\AENV\((.+)\)\z/)) # the whole string must be ENV(...); the capture is the variable name
+      ENV[m[1]] # nil when that variable is not set
+    else
+      field
+    end
+  else
+    nil # non-String input (nil, numbers, ...) yields nil
+  end
+end
+cmd = ARGV.shift or abort "Usage: raimei-bench <run|report> ..." # first positional argument selects the subcommand
+case cmd
+when "run"
+  opts = { url: ENV["URL"], model: ENV["MODEL"], api_key: ENV["API_KEY"], stream: true } # defaults come from the environment; flags below override them
+  OptionParser.new do |o|
+    o.banner = "Usage: raimei-bench run <scenario.yml> [--url URL] [--model MODEL] [--api-key KEY] [--no-stream]"
+    o.on("--url URL"){|v| opts[:url]=v}
+    o.on("--model MODEL"){|v| opts[:model]=v}
+    o.on("--api-key KEY"){|v| opts[:api_key]=v}
+    o.on("--no-stream"){ opts[:stream]=false }
+  end.parse! # parse! removes recognised options from ARGV, leaving the positional arguments
+  file = ARGV.shift or abort "scenario.yml required"
+  y = YAML.load_file(file)
+  name   = y["name"] || File.basename(file, ".*") # default name: scenario file name without its extension
+  url    = opts[:url]   || env_or_literal(y["url"])   || ENV["URL"] # NOTE(review): opts[:url] already defaults to ENV["URL"], so the environment outranks the YAML value and the last fallback is redundant
+  model  = opts[:model] || env_or_literal(y["model"]) || ENV["MODEL"] # NOTE(review): same precedence as url — ENV["MODEL"] wins over the YAML value
+  stream = opts.key?(:stream) ? opts[:stream] : (y["stream"] != false) # NOTE(review): opts always contains :stream (defaulted to true above), so y["stream"] is never consulted
+  prompts = y["prompts"]
+  prompts = File.expand_path(prompts, File.dirname(file)) if prompts.is_a?(String) # a String is a path, resolved relative to the scenario file
+  abort "URL missing (set --url or URL env)"     unless url && !url.empty?
+  abort "MODEL missing (set --model or MODEL)"   unless model && !model.empty?
+  sc = Raimei::Bench::Scenario.new(name: name, url: url, model: model, api_key: opts[:api_key], stream: stream) # api_key comes only from --api-key / API_KEY; the YAML file is not read for it
+  sc.run(prompts)
+when "report"
+  path = ARGV.shift or abort "Usage: raimei-bench report reports/<name>.json"
+  out  = Raimei::Bench::Report.write(path) # write returns the path of the generated HTML file
+  puts "wrote #{out}"
+else
+  abort "Unknown command: #{cmd}"
+end

data/lib/raimei/bench/report.rb ADDED

@@ -0,0 +1,55 @@
+# frozen_string_literal: true
+require "json"
+require "erb"
+module Raimei
+  module Bench
+    module Report # Renders a benchmark results JSON file as a standalone HTML page
+      TEMPLATE = <<~HTML
+      <!doctype html><meta charset="utf-8">
+      <title><%= name %> – Raimei Bench</title>
+      <style>
+        body{font-family:system-ui,-apple-system,Segoe UI,Roboto,Ubuntu,"Helvetica Neue",sans-serif;max-width:920px;margin:32px auto;padding:0 12px}
+        table{border-collapse:collapse;width:100%} th,td{border:1px solid #ddd;padding:8px} th{background:#f7f7f7;text-align:left}
+        .sum{margin:12px 0 20px}
+        .muted{color:#666}
+      </style>
+      <h1><%= name %></h1>
+      <p class="sum">Count: <b><%= data.length %></b> • p50: <b><%= p50 %> ms</b> • p95: <b><%= p95 %> ms</b><% if ttfb_p50 %> • TTFB p50: <b><%= ttfb_p50 %> ms</b><% end %></p>
+      <table>
+        <tr><th>#</th><th>Latency (ms)</th><th>TTFB (ms)</th><th>Prompt</th><th>Output len</th></tr>
+        <% data.each_with_index do |r,i| t=r[:telemetry]; %>
+          <tr>
+            <td><%= i+1 %></td>
+            <td><%= t[:latency_ms] %></td>
+            <td><%= t.dig(:extra,:ttfb_ms) || "" %></td>
+            <td class="muted"><%= r[:prompt] %></td>
+            <td><%= t.dig(:extra,:output_len) %></td>
+          </tr>
+        <% end %>
+      </table>
+      HTML
+      def self.write(json_path, html_path=nil) # Reads the results JSON, renders TEMPLATE and writes the HTML; returns the output path
+        data = JSON.parse(File.read(json_path), symbolize_names: true) # symbol keys, because the template reads r[:telemetry] and r[:prompt]
+        times = data.map { |r| r[:telemetry][:latency_ms] }
+        ttfb  = data.map { |r| r[:telemetry].dig(:extra, :ttfb_ms) }.compact # rows without a TTFB value are dropped
+        p50   = pctile(times, 50)
+        p95   = pctile(times, 95)
+        ttfb_p50 = ttfb.empty? ? nil : pctile(ttfb, 50) # nil hides the TTFB figure in the summary line
+        name = File.basename(json_path, ".json")
+        html = ERB.new(TEMPLATE).result(binding) # the template reads the locals above; NOTE(review): name and prompt are interpolated without HTML escaping, so markup in them is emitted as markup
+        out  = html_path || json_path.sub(/\.json\z/, ".html") # default: same path with .json replaced by .html
+        File.write(out, html)
+        out
+      end
+      def self.pctile(arr, p) # p-th percentile (p in 0..100) of arr, interpolating linearly between neighbouring sorted values; nil for an empty array
+        return nil if arr.empty?
+        a = arr.sort; k=(p/100.0)*(a.length-1); f=k.floor; c=k.ceil # k is the fractional index into the sorted array
+        return a[f] if f==c # k is a whole number: return that element as-is
+        a[f] + (a[c]-a[f])*(k-f)
+      end
+    end
+  end
+end

data/lib/raimei/bench/version.rb CHANGED

@@ -2,6 +2,6 @@
 module Raimei
   module Bench
-    VERSION = "0.1.0"
+    VERSION = "0.1.2"
   end
 end

data/lib/raimei/bench.rb CHANGED

@@ -1,29 +1,118 @@
 # frozen_string_literal: true
 require "json"
+require "yaml"
 require "raimei/shared"
 require "raimei/nim"
 module Raimei
   module Bench
     class Scenario
-      def initialize(name:, url:, model:, api_key: nil)
-        @name, @url, @model, @api_key = name, url, model, api_key
+      # name:   report base name (also printed in summary)
+      # url:    OpenAI-compatible /v1/chat/completions endpoint
+      # model:  model id/name for the provider
+      # api_key: optional bearer token
+      # stream: true -> measure time-to-first-byte (TTFB) + total; false -> total only
+      # outdir: directory for report artifacts (JSON now; HTML can be added by CLI)
+      def initialize(name:, url:, model:, api_key: nil, stream: true, outdir: "reports")
+        @name, @url, @model, @api_key, @stream, @outdir =
+          name,  url,  model,  api_key,  stream,  outdir
       end
-      def run(prompts)
-        client = Raimei::NIM::Client.new(url: @url, api_key: @api_key)
+      # prompts_or_path:
+      #  * Array<String>               -> prompts directly
+      #  * "path/to/file.jsonl"        -> lines like {"prompt":"..."}
+      #  * "path/to/file.yml|.yaml"    -> must contain key "prompts" pointing to file or array
+      #  * "path/to/file.txt"          -> one prompt per line
+      #
+      # Returns the in-memory results array; also writes JSON to @outdir/<name>.json
+      def run(prompts_or_path)
+        prompts = load_prompts(prompts_or_path)
+        client  = Raimei::NIM::Client.new(url: @url, api_key: @api_key)
         results = []
-        prompts.each do |p|
+        latencies = []
+        ttfbs = []
+        prompts.each do |prompt|
           t0 = Raimei::Shared.now_ms # start timestamp, taken before the request is issued
-          out = client.chat(model: @model, messages: [{role: "user", content: p}])
-          ev = Raimei::Shared.finish(name: @name, start_ms: t0, model: @model, extra: { prompt_len: p.size, output_len: out.size })
-          results << { prompt: p, output: out, telemetry: ev.to_h }
+          out = +"" # unary plus gives an unfrozen buffer (the file sets frozen_string_literal) so deltas can be appended
+          ttfb_ms = nil
+          if @stream
+            client.chat(model: @model, messages: [{ role: "user", content: prompt }], stream: true).each do |delta| # presumably yields String chunks — confirm against Raimei::NIM::Client
+              ttfb_ms ||= (Raimei::Shared.now_ms - t0) # assigned once, when the first delta arrives
+              out << delta
+            end
+          else
+            out = client.chat(model: @model, messages: [{ role: "user", content: prompt }], stream: false)
+          end
+          ev = Raimei::Shared.finish(
+            name: @name, start_ms: t0, model: @model,
+            tokens_in: nil, tokens_out: nil,
+            extra: { prompt_len: prompt.size, output_len: out.size, ttfb_ms: ttfb_ms }
+          )
+          latencies << ev.latency_ms
+          ttfbs     << ttfb_ms if ttfb_ms # stays empty when streaming is off
+          results   << { prompt: prompt, output: out, telemetry: ev.to_h }
         end
-        Dir.mkdir("reports") unless Dir.exist?("reports")
-        File.write("reports/#{@name}.json", JSON.pretty_generate(results))
+        Dir.mkdir(@outdir) unless Dir.exist?(@outdir) # NOTE(review): Dir.mkdir creates one level only; a nested outdir whose parent is missing raises
+        json_path = File.join(@outdir, "#{@name}.json")
+        File.write(json_path, JSON.pretty_generate(results))
+        summary = {
+          count:      latencies.size,
+          p50_ms:     pctile(latencies, 50),
+          p95_ms:     pctile(latencies, 95),
+          ttfb_p50_ms: ttfbs.empty? ? nil : pctile(ttfbs, 50)
+        }
+        puts "== #{@name} #{summary.inspect}"
         results
       end
+      private
+      # Loads prompts from:
+      # - Array<String>
+      # - .jsonl (expects objects with "prompt")
+      # - .yml/.yaml (expects key "prompts": either array of strings or a file path)
+      # - other text file (one prompt per line)
+      def load_prompts(source)
+        return source if source.is_a?(Array) # arrays are returned as given, without conversion
+        case File.extname(source)
+        when ".jsonl"
+          File.readlines(source, chomp: true).map { |l| JSON.parse(l).fetch("prompt") } # fetch raises KeyError when a line has no "prompt"; NOTE(review): a blank line fails JSON parsing
+        when ".yml", ".yaml"
+          y = YAML.load_file(source)
+          prompts = y["prompts"] || y[:prompts]
+          if prompts.is_a?(Array)
+            prompts.map(&:to_s)
+          elsif prompts.is_a?(String)
+            resolved = File.expand_path(prompts, File.dirname(source)) # path is relative to the YAML file
+            load_prompts(resolved) # recurse so the referenced file is read according to its own extension
+          else
+            raise ArgumentError, "YAML must contain 'prompts' (array or path), got: #{prompts.inspect}"
+          end
+        else
+          # treat as plain text: one prompt per line
+          File.readlines(source, chomp: true) # NOTE(review): blank lines are kept and become empty prompts
+        end
+      end
+      def pctile(arr, p) # p-th percentile (p in 0..100) with linear interpolation; nil for an empty array. Same formula as Report.pctile
+        return nil if arr.empty?
+        a = arr.sort
+        k = (p / 100.0) * (a.length - 1) # fractional index into the sorted array
+        f = k.floor
+        c = k.ceil
+        return a[f] if f == c # k is a whole number: return that element as-is
+        a[f] + (a[c] - a[f]) * (k - f)
+      end
     end
   end
 end

metadata CHANGED

@@ -1,7 +1,7 @@
 --- !ruby/object:Gem::Specification
 name: raimei-bench
 version: !ruby/object:Gem::Version
-  version: 0.1.0
+  version: 0.1.2
 platform: ruby
 authors:
 - Hal Fulton
@@ -9,18 +9,23 @@ bindir: exe
 cert_chain: []
 date: 1980-01-02 00:00:00.000000000 Z
 dependencies: []
-description: Provider-agnostic benchmark harness for LLM/CV/audio in Ruby.
+description: Run prompts against multiple backends; record p50/p95 latency & output
+  JSON reports. Experimental; APIs may change.
 email:
 - rubyhacker@gmail.com
-executables: []
+executables:
+- raimei-bench
 extensions: []
 extra_rdoc_files: []
 files:
 - CHANGELOG.md
+- Gemfile
 - LICENSE.txt
 - README.md
 - Rakefile
+- exe/raimei-bench
 - lib/raimei/bench.rb
+- lib/raimei/bench/report.rb
 - lib/raimei/bench/version.rb
 - sig/raimei/bench.rbs
 homepage: https://github.com/raimei-ruby/raimei
@@ -36,7 +41,7 @@ required_ruby_version: !ruby/object:Gem::Requirement
   requirements:
   - - ">="
     - !ruby/object:Gem::Version
-      version: 3.2.0
+      version: '3.2'
 required_rubygems_version: !ruby/object:Gem::Requirement
   requirements:
   - - ">="
@@ -45,5 +50,5 @@ required_rubygems_version: !ruby/object:Gem::Requirement
 requirements: []
 rubygems_version: 3.7.1
 specification_version: 4
-summary: Provider-agnostic benchmark harness for LLM/CV/audio in Ruby.
+summary: Provider-agnostic AI benchmark harness.
 test_files: []