RubyGems - completion-kit - Versions diffs - 0.20.3 → 0.20.4 - Mend

completion-kit 0.20.3 → 0.20.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (16)

checksums.yaml +4 -4
data/app/assets/javascripts/completion_kit/application.js +70 -0
data/app/assets/stylesheets/completion_kit/application.css +13 -3
data/app/controllers/completion_kit/metrics_controller.rb +10 -1
data/app/controllers/completion_kit/runs_controller.rb +1 -1
data/app/models/completion_kit/run.rb +3 -3
data/app/services/completion_kit/mcp_tools/judges.rb +1 -1
data/app/services/completion_kit/mcp_tools/prompts.rb +2 -2
data/app/services/completion_kit/mcp_tools/runs.rb +1 -1
data/app/views/completion_kit/api_reference/_body.html.erb +15 -1
data/app/views/completion_kit/metrics/_form.html.erb +16 -14
data/app/views/completion_kit/runs/_form.html.erb +2 -2
data/app/views/completion_kit/runs/_row.html.erb +1 -1
data/app/views/completion_kit/runs/_status_header.html.erb +1 -1
data/lib/completion_kit/version.rb +1 -1
metadata +1 -1

checksums.yaml CHANGED Viewed

@@ -1,7 +1,7 @@
 ---
 SHA256:
-  metadata.gz: 71e8645d7a790e2afc35e4fb7c8ca4ec5a6d08f51f3f84a2c289a2b6c76a9051
-  data.tar.gz: f5143766d938735ae5f2072516bc520c7d826894c02dc6a584bf62e40dd4b583
+  metadata.gz: e49a3e185722be44be75a0e236862942841720af9f8b6bdcfe233778968d26ab
+  data.tar.gz: 1545324b88bc8eef05f507d71a80e06804d4a9d3c65f99010b76610657ffa021
 SHA512:
-  metadata.gz: 0a6c71340315065125e6bc520f80453132de07d858acd4e5327d2cc35d3b3420c920a2f2ccf148c696c20afdad15371f6323d27d85dd7f3d9baa8dd03d3f5386
-  data.tar.gz: 65c2978028e0897cb00e350f3a9e6af98f11e8d6fc6327da245acdbcc6de41bd783b8bbfe63b1cb76fc54e65debbd4488d71103f35d4222478c9611220d84a95
+  metadata.gz: 21f1b48c9ed2ba23b111eb1ff733ac62f180050ce3e1edd9ea31719ee25cf557025af86e00f13be27b6e04a79afb677ced23fa7e7e5a9580715249533559338c
+  data.tar.gz: a7799c294e109c42a585f9fc7aa01e94d389291dd3fc1eec6821123ea4cb066e5cb805b803dfcf935f771b494bf1324fd7f5787f781746cfd0290d6c97b93641

data/app/assets/javascripts/completion_kit/application.js CHANGED Viewed

@@ -210,6 +210,76 @@ document.addEventListener("click", function(e) {
   });
 });
+var CK_CHECK_FIELDS = {
+  contains: ["value", "case_sensitive", "trim"],
+  not_contains: ["value", "case_sensitive", "trim"],
+  equals: ["value", "case_sensitive", "trim"],
+  regex: ["pattern", "case_sensitive", "multiline"],
+  valid_json: [],
+  json_path_equals: ["json_path", "expected"],
+  length_bounds: ["min", "max"],
+  no_refusal: []
+};
+function ckApplyCheckFields(scope) {
+  if (!scope) return;
+  var kindSelect = scope.querySelector('[name="metric[check_config][check_kind]"]');
+  if (!kindSelect) return;
+  var visible = CK_CHECK_FIELDS[kindSelect.value];
+  var targetSelect = scope.querySelector('[name="metric[check_config][target]"]');
+  var targetIsJsonPath = !!(targetSelect && targetSelect.value === "json_path");
+  scope.querySelectorAll("[data-ck-check-field]").forEach(function(field) {
+    var key = field.getAttribute("data-ck-check-field");
+    var show;
+    if (key === "target_path") {
+      show = targetIsJsonPath;
+    } else if (!visible) {
+      show = true;
+    } else {
+      show = visible.indexOf(key) !== -1;
+    }
+    field.hidden = !show;
+  });
+}
+function ckApplyMetricType(group) {
+  var checked = group.querySelector('input[type="radio"]:checked');
+  if (!checked) return;
+  var value = checked.value;
+  var scope = group.closest("form") || document;
+  scope.querySelectorAll("[data-ck-metric-editor]").forEach(function(editor) {
+    var active = editor.getAttribute("data-ck-metric-editor") === value;
+    editor.hidden = !active;
+    editor.querySelectorAll("input, select, textarea").forEach(function(field) {
+      field.disabled = !active;
+    });
+  });
+  ckApplyCheckFields(scope);
+}
+document.addEventListener("turbo:load", function() {
+  document.querySelectorAll("[data-ck-metric-type]").forEach(function(group) {
+    ckApplyMetricType(group);
+  });
+  document.querySelectorAll('[data-ck-metric-editor="check"]').forEach(function(editor) {
+    ckApplyCheckFields(editor);
+  });
+});
+document.addEventListener("change", function(e) {
+  var target = e.target;
+  if (!target || !target.closest) return;
+  var group = target.closest("[data-ck-metric-type]");
+  if (group && target.type === "radio") {
+    ckApplyMetricType(group);
+    return;
+  }
+  if (target.name === "metric[check_config][check_kind]" || target.name === "metric[check_config][target]") {
+    var scope = target.closest('[data-ck-metric-editor="check"]') || target.closest("form");
+    ckApplyCheckFields(scope);
+  }
+});
 document.addEventListener("click", function(e) {
   var btn = e.target.closest("[data-ck-apply]");
   if (!btn) return;

data/app/assets/stylesheets/completion_kit/application.css CHANGED Viewed

@@ -1922,6 +1922,13 @@ label.ck-checkbox input {
   cursor: pointer;
 }
+.ck-radio-info {
+  width: 16px;
+  height: 16px;
+  color: var(--ck-muted);
+  cursor: help;
+}
 .ck-field-row {
   display: flex;
   gap: 1rem;
@@ -3238,7 +3245,8 @@ select.ck-input {
 #ck-tab-metric-groups:checked ~ .ck-api-tabs__nav label[for="ck-tab-metric-groups"],
 #ck-tab-agreements:checked ~ .ck-api-tabs__nav label[for="ck-tab-agreements"],
 #ck-tab-tags:checked ~ .ck-api-tabs__nav label[for="ck-tab-tags"],
-#ck-tab-providers:checked ~ .ck-api-tabs__nav label[for="ck-tab-providers"] {
+#ck-tab-providers:checked ~ .ck-api-tabs__nav label[for="ck-tab-providers"],
+#ck-tab-imports:checked ~ .ck-api-tabs__nav label[for="ck-tab-imports"] {
   color: var(--ck-accent);
   background: var(--ck-surface-soft);
   border-left-color: var(--ck-accent);
@@ -3253,7 +3261,8 @@ select.ck-input {
 #ck-tab-metric-groups:checked ~ .ck-api-tabs__panels .ck-api-tabs__panel:nth-child(7),
 #ck-tab-agreements:checked ~ .ck-api-tabs__panels .ck-api-tabs__panel:nth-child(8),
 #ck-tab-tags:checked ~ .ck-api-tabs__panels .ck-api-tabs__panel:nth-child(9),
-#ck-tab-providers:checked ~ .ck-api-tabs__panels .ck-api-tabs__panel:nth-child(10) {
+#ck-tab-providers:checked ~ .ck-api-tabs__panels .ck-api-tabs__panel:nth-child(10),
+#ck-tab-imports:checked ~ .ck-api-tabs__panels .ck-api-tabs__panel:nth-child(11) {
   display: block;
 }
@@ -3295,7 +3304,8 @@ select.ck-input {
   #ck-tab-metric-groups:checked ~ .ck-api-tabs__nav label[for="ck-tab-metric-groups"],
   #ck-tab-agreements:checked ~ .ck-api-tabs__nav label[for="ck-tab-agreements"],
   #ck-tab-tags:checked ~ .ck-api-tabs__nav label[for="ck-tab-tags"],
-  #ck-tab-providers:checked ~ .ck-api-tabs__nav label[for="ck-tab-providers"] {
+  #ck-tab-providers:checked ~ .ck-api-tabs__nav label[for="ck-tab-providers"],
+  #ck-tab-imports:checked ~ .ck-api-tabs__nav label[for="ck-tab-imports"] {
     border-left-color: transparent;
     border-bottom-color: var(--ck-accent);
   }

data/app/controllers/completion_kit/metrics_controller.rb CHANGED Viewed

@@ -68,7 +68,7 @@ module CompletionKit
     end
     def create
-      @metric = Metric.new(metric_params)
+      @metric = Metric.new(create_metric_params)
       if @metric.save
         redirect_to metric_path(@metric), notice: "Metric was successfully created."
@@ -235,6 +235,15 @@ module CompletionKit
       @metric = Metric.find(params[:id])
     end
+    def create_metric_params
+      attrs = metric_params
+      if attrs[:metric_type] == "check"
+        attrs.except(:instruction, :rubric_bands)
+      else
+        attrs.except(:check_config)
+      end
+    end
     def metric_params
       permitted = params.require(:metric).permit(:name, :instruction, :metric_type,
         rubric_bands: [:stars, :description],

data/app/controllers/completion_kit/runs_controller.rb CHANGED Viewed

@@ -122,7 +122,7 @@ module CompletionKit
     def suggest
       if @run.prompt.nil?
-        redirect_to run_path(@run), alert: "Judge-only runs don't have a prompt to improve."
+        redirect_to run_path(@run), alert: "A run that only scores existing outputs has no prompt to improve."
         return
       end

data/app/models/completion_kit/run.rb CHANGED Viewed

@@ -30,7 +30,7 @@ module CompletionKit
       display_scoped.select(:id)
     end
-    # A judge-only run grades a pre-existing column on the dataset instead of
+    # A scoring-only run grades a pre-existing column on the dataset instead of
     # generating new outputs. No prompt is attached; the response text is read
     # from row[output_column]; no LLM generation happens.
     def judge_only?
@@ -442,7 +442,7 @@ module CompletionKit
         self.name = "#{prompt.name} — v#{prompt.version_number} ##{count}"
       elsif dataset.present?
         count = Run.where(prompt_id: nil, dataset_id: dataset.id).count + 1
-        self.name = "#{dataset.name} — judge-only ##{count}"
+        self.name = "#{dataset.name} scoring ##{count}"
       end
     end
@@ -461,7 +461,7 @@ module CompletionKit
       return if prompt.present?
       if dataset.nil?
-        errors.add(:dataset_id, "is required for a judge-only run (no prompt)")
+        errors.add(:dataset_id, "is required when scoring existing outputs (no prompt)")
         return
       end

data/app/services/completion_kit/mcp_tools/judges.rb CHANGED Viewed

@@ -5,7 +5,7 @@ module CompletionKit
       TOOLS = {
         "judges_replay" => {
-          description: "Run the current judge against a dataset (judge-only run). Wraps runs_create with prompt_id omitted and output_column supplied. Re-judges existing dataset outputs so you can compare against human verdicts.",
+          description: "Run the current judge against a dataset (scores existing outputs). Wraps runs_create with prompt_id omitted and output_column supplied. Re-judges existing dataset outputs so you can compare against human verdicts.",
           inputSchema: {
             type: "object",
             properties: {

data/app/services/completion_kit/mcp_tools/prompts.rb CHANGED Viewed

@@ -51,7 +51,7 @@ module CompletionKit
           handler: :publish
         },
         "prompts_suggest_improvement" => {
-          description: "Suggest an improved version of a prompt, grounded in a run's test results and judge feedback. Analyzes the run's responses, scores, and reviews, then returns reasoning plus a rewritten template (preserving {{variables}}) and persists it as a Suggestion. Requires a run that has a prompt (not a judge-only run).",
+          description: "Suggest an improved version of a prompt, grounded in a run's test results and judge feedback. Analyzes the run's responses, scores, and reviews, then returns reasoning plus a rewritten template (preserving {{variables}}) and persists it as a Suggestion. Requires a run that has a prompt (not a scoring-only run).",
           inputSchema: {
             type: "object",
             properties: {run_id: {type: "integer", description: "The run whose results ground the improvement."}},
@@ -107,7 +107,7 @@ module CompletionKit
       def self.suggest_improvement(args)
         run = Run.find(args["run_id"])
-        return error_result("Judge-only runs don't have a prompt to improve.") if run.prompt.nil?
+        return error_result("A run that only scores existing outputs has no prompt to improve.") if run.prompt.nil?
         result = PromptImprovementService.new(run).suggest
         return error_result("The model didn't return a usable rewrite.") if result["suggested_template"].blank?

data/app/services/completion_kit/mcp_tools/runs.rb CHANGED Viewed

@@ -15,7 +15,7 @@ module CompletionKit
           handler: :get
         },
         "runs_create" => {
-          description: "Create a run. Omit prompt_id and provide output_column for a judge-only run that grades a pre-existing dataset column instead of generating new outputs.",
+          description: "Create a run. Omit prompt_id and provide output_column to score existing outputs by grading a pre-existing dataset column instead of generating new ones.",
           inputSchema: {
             type: "object",
             properties: {

data/app/views/completion_kit/api_reference/_body.html.erb CHANGED Viewed

@@ -20,6 +20,7 @@
   <input type="radio" name="ck-api-tab" id="ck-tab-agreements" class="ck-api-tabs__radio">
   <input type="radio" name="ck-api-tab" id="ck-tab-tags" class="ck-api-tabs__radio">
   <input type="radio" name="ck-api-tab" id="ck-tab-providers" class="ck-api-tabs__radio">
+  <input type="radio" name="ck-api-tab" id="ck-tab-imports" class="ck-api-tabs__radio">
   <nav class="ck-api-tabs__nav">
     <label for="ck-tab-mcp" class="ck-api-tabs__label">MCP <span class="ck-api-tabs__count"><%= CompletionKit::McpDispatcher.tool_definitions.size %></span></label>
@@ -32,6 +33,7 @@
     <label for="ck-tab-agreements" class="ck-api-tabs__label">Agreements <span class="ck-api-tabs__count">3</span></label>
     <label for="ck-tab-tags" class="ck-api-tabs__label">Tags <span class="ck-api-tabs__count">5</span></label>
     <label for="ck-tab-providers" class="ck-api-tabs__label">Providers <span class="ck-api-tabs__count">5</span></label>
+    <label for="ck-tab-imports" class="ck-api-tabs__label">Imports <span class="ck-api-tabs__count">1</span></label>
   </nav>
   <div class="ck-api-tabs__panels">
@@ -124,7 +126,7 @@
       <div class="ck-api-endpoint">
         <p class="ck-api-method"><span class="ck-chip ck-chip--soft">POST</span> /api/v1/runs</p>
         <p class="ck-meta-copy">Create a new run.</p>
-        <p class="ck-api-params"><strong>Optional:</strong>&ensp;<code>name</code>, <code>prompt_id</code>, <code>dataset_id</code>, <code>metric_ids</code>, <code>judge_model</code>, <code>output_column</code> (judge-only: omit <code>prompt_id</code> and grade a dataset column instead, default <code>actual_output</code>)</p>
+        <p class="ck-api-params"><strong>Optional:</strong>&ensp;<code>name</code>, <code>prompt_id</code>, <code>dataset_id</code>, <code>metric_ids</code>, <code>judge_model</code>, <code>output_column</code> (score existing outputs: omit <code>prompt_id</code> and grade a dataset column instead, default <code>actual_output</code>)</p>
         <%= render "completion_kit/api_reference/example", base_url: base_url, token: token, real_token: real_token, cmd: "curl -X POST #{base_url}/api/v1/runs \\\n  -H \"Authorization: Bearer #{token}\" \\\n  -H \"Content-Type: application/json\" \\\n  -d '{\"prompt_id\": 1, \"dataset_id\": 1, \"metric_ids\": [1, 2]}'" %>
       </div>
       <div class="ck-api-endpoint">
@@ -379,6 +381,18 @@
             } %>
     </div>
+    <div class="ck-api-tabs__panel">
+      <h2 class="ck-section-title">Imports</h2>
+      <p class="ck-copy">Bring an existing <a href="https://www.promptfoo.dev" class="ck-link">promptfoo</a> config into CompletionKit in one call. Prompts, the test dataset, assert-based metrics, and providers are created where they map cleanly and skipped with a reason where they don't.</p>
+      <div class="ck-api-endpoint">
+        <p class="ck-api-method"><span class="ck-chip ck-chip--soft">POST</span> /api/v1/imports/promptfoo</p>
+        <p class="ck-meta-copy">Import a promptfooconfig.yaml. Send the YAML as a <code>config</code> param, or POST the raw YAML as the request body. Returns 201 with a mapping summary, or 422 if the YAML cannot be parsed.</p>
+        <p class="ck-api-params"><strong>Request:</strong>&ensp;<code>config</code> (the YAML text) or a raw YAML request body</p>
+        <p class="ck-api-params"><strong>Response 201:</strong>&ensp;<code>prompts</code>, <code>dataset</code>, <code>metrics</code>, and <code>providers</code>, each listing what was <code>created</code> and what was <code>skipped</code> (with a reason)</p>
+        <%= render "completion_kit/api_reference/example", base_url: base_url, token: token, real_token: real_token, cmd: "curl -X POST #{base_url}/api/v1/imports/promptfoo \\\n  -H \"Authorization: Bearer #{token}\" \\\n  -H \"Content-Type: application/x-yaml\" \\\n  --data-binary @promptfooconfig.yaml" %>
+      </div>
+    </div>
   </div>
 </div>

data/app/views/completion_kit/metrics/_form.html.erb CHANGED Viewed

@@ -75,20 +75,22 @@
     <% else %>
       <div class="ck-field" data-ck-metric-type>
         <p class="ck-section-title">Metric type</p>
-        <p class="ck-hint">An LLM judge scores each output on a 1-5 rubric. A deterministic check passes or fails with no model call.</p>
+        <p class="ck-hint">The judge gives each response 1 to 5 stars against your rubric. A check just passes or fails, with no AI.</p>
         <label class="ck-radio">
           <%= form.radio_button :metric_type, "llm_judge", checked: !metric.check? %>
           <span>LLM judge (1-5)</span>
+          <%= heroicon_tag "information-circle", variant: :outline, size: 16, class: "ck-radio-info", "aria-hidden": "true", title: "An AI reads each response and rates it 1 to 5 stars against your rubric, with a written reason. Best for subjective quality: tone, helpfulness, accuracy." %>
         </label>
         <label class="ck-radio">
           <%= form.radio_button :metric_type, "check", checked: metric.check? %>
           <span>Deterministic check</span>
+          <%= heroicon_tag "information-circle", variant: :outline, size: 16, class: "ck-radio-info", "aria-hidden": "true", title: "A rule that passes or fails instantly with no AI and no cost. Best for exact things: valid JSON, contains a phrase, no refusal." %>
         </label>
       </div>
     <% end %>
     <% if show_judge %>
-    <div class="ck-field ck-field--spacious" data-ck-metric-editor="llm_judge">
+    <div class="ck-field ck-field--spacious" data-ck-metric-editor="llm_judge" <%= "hidden" if metric.check? %>>
       <p class="ck-section-title">Instruction</p>
       <p class="ck-hint">What should the judge assess? This instruction is sent to the LLM judge when scoring outputs.</p>
       <%= form.text_area :instruction, rows: 8, class: "ck-input ck-input--area", placeholder: "Evaluate whether the output...", **ck_field_aria(form, :instruction) %>
@@ -112,7 +114,7 @@
       <% end %>
     </div>
-    <div class="ck-field ck-field--spacious">
+    <div class="ck-field ck-field--spacious" data-ck-metric-editor="llm_judge" <%= "hidden" if metric.check? %>>
       <p class="ck-section-title">Rubric<%= render "completion_kit/metrics/rubric_hint" %></p>
       <p class="ck-hint">What each star rating means for this metric.</p>
@@ -155,7 +157,7 @@
     <% if show_check %>
     <% check = metric.check_config || {} %>
-    <div class="ck-field ck-field--spacious" data-ck-metric-editor="check">
+    <div class="ck-field ck-field--spacious" data-ck-metric-editor="check" <%= "hidden" unless metric.check? %>>
       <p class="ck-section-title">Check</p>
       <p class="ck-hint">A deterministic pass/fail rule. Fill only the fields the chosen kind needs.</p>
@@ -177,56 +179,56 @@
         </select>
       </div>
-      <div class="ck-field">
+      <div class="ck-field" data-ck-check-field="target_path">
         <label class="ck-label" for="metric_check_target_path">Target path</label>
         <p class="ck-hint">Used when target is json_path, e.g. data.items.0.name.</p>
         <input type="text" name="metric[check_config][target_path]" id="metric_check_target_path" class="ck-input" value="<%= check["target_path"] %>">
       </div>
-      <div class="ck-field">
+      <div class="ck-field" data-ck-check-field="value">
         <label class="ck-label" for="metric_check_value">Value</label>
         <p class="ck-hint">The substring or exact string for contains, not_contains, or equals.</p>
         <input type="text" name="metric[check_config][value]" id="metric_check_value" class="ck-input" value="<%= check["value"] %>">
       </div>
-      <div class="ck-field">
+      <div class="ck-field" data-ck-check-field="pattern">
         <label class="ck-label" for="metric_check_pattern">Pattern</label>
         <p class="ck-hint">A regular expression for the regex kind.</p>
         <input type="text" name="metric[check_config][pattern]" id="metric_check_pattern" class="ck-input" value="<%= check["pattern"] %>">
       </div>
-      <div class="ck-field">
+      <div class="ck-field" data-ck-check-field="json_path">
         <label class="ck-label" for="metric_check_json_path">JSON path</label>
         <p class="ck-hint">Dotted path into parsed JSON for json_path_equals.</p>
         <input type="text" name="metric[check_config][json_path]" id="metric_check_json_path" class="ck-input" value="<%= check["json_path"] %>">
       </div>
-      <div class="ck-field">
+      <div class="ck-field" data-ck-check-field="expected">
         <label class="ck-label" for="metric_check_expected">Expected</label>
         <p class="ck-hint">The value the JSON path must equal.</p>
         <input type="text" name="metric[check_config][expected]" id="metric_check_expected" class="ck-input" value="<%= check["expected"] %>">
       </div>
       <div class="ck-field-row">
-        <div class="ck-field">
+        <div class="ck-field" data-ck-check-field="min">
           <label class="ck-label" for="metric_check_min">Min length</label>
           <input type="number" name="metric[check_config][min]" id="metric_check_min" class="ck-input" value="<%= check["min"] %>">
         </div>
-        <div class="ck-field">
+        <div class="ck-field" data-ck-check-field="max">
           <label class="ck-label" for="metric_check_max">Max length</label>
           <input type="number" name="metric[check_config][max]" id="metric_check_max" class="ck-input" value="<%= check["max"] %>">
         </div>
       </div>
-      <label class="ck-checkbox">
+      <label class="ck-checkbox" data-ck-check-field="case_sensitive">
         <input type="checkbox" name="metric[check_config][case_sensitive]" value="true"<%= " checked" if check["case_sensitive"] %>>
         <span>Case sensitive</span>
       </label>
-      <label class="ck-checkbox">
+      <label class="ck-checkbox" data-ck-check-field="multiline">
         <input type="checkbox" name="metric[check_config][multiline]" value="true"<%= " checked" if check["multiline"] %>>
         <span>Multiline</span>
       </label>
-      <label class="ck-checkbox">
+      <label class="ck-checkbox" data-ck-check-field="trim">
         <input type="checkbox" name="metric[check_config][trim]" value="true"<%= " checked" if check["trim"] %>>
         <span>Trim whitespace</span>
       </label>

data/app/views/completion_kit/runs/_form.html.erb CHANGED Viewed

@@ -22,7 +22,7 @@
         <%= check_box_tag "run[judge_only]", "1", run.persisted? && run.judge_only?, id: "run_judge_only", class: "ck-checkbox" %>
         <span class="ck-checkbox-label__box" aria-hidden="true"></span>
         <span class="ck-checkbox-label__body">
-          <span class="ck-checkbox-label__text">Judge-only run</span>
+          <span class="ck-checkbox-label__text">Score existing outputs</span>
           <span class="ck-checkbox-label__hint">Grade an existing column on the dataset instead of running a prompt. Roughly half the LLM calls per row.</span>
         </span>
       </label>
@@ -263,7 +263,7 @@ function updateRunForm() {
       }
     } else if (!dataset) {
       if (datasetField) datasetField.className = 'ck-field ck-field--info';
-      if (datasetHint) datasetHint.textContent = 'Judge-only runs need a dataset that supplies the output column.';
+      if (datasetHint) datasetHint.textContent = 'Skip generation and score responses you already have from a dataset column. Works with rubric metrics or deterministic checks.';
     }
   } else {
     valid = prompt !== '';

data/app/views/completion_kit/runs/_row.html.erb CHANGED Viewed

@@ -10,7 +10,7 @@
           <%= link_to run.prompt.name, ck_prompt_path(run.prompt), class: "ck-runs-table__config-link", onclick: "event.stopPropagation();" %>
           <span class="ck-runs-table__version">v<%= run.prompt.version_number %></span>
         <% else %>
-          <span class="ck-runs-table__version">Judge-only</span>
+          <span class="ck-runs-table__version">Scoring only</span>
         <% end %>
         <% if run.dataset %>
           <span class="ck-runs-table__sep">·</span>

data/app/views/completion_kit/runs/_status_header.html.erb CHANGED Viewed

@@ -22,7 +22,7 @@
       <% if run.prompt %>
         <p class="ck-meta-copy"><%= link_to run.prompt.display_name, prompt_path(run.prompt), class: "ck-link" %>&ensp;<span class="ck-chip" style="text-transform: none;"><%= run.prompt.llm_model %></span></p>
       <% else %>
-        <p class="ck-meta-copy">Judge-only run — grading column <code><%= run.output_column.presence || "actual_output" %></code><% if run.dataset %> on <%= link_to run.dataset.name, dataset_path(run.dataset), class: "ck-link" %><% end %></p>
+        <p class="ck-meta-copy">Scoring existing outputs, grading column <code><%= run.output_column.presence || "actual_output" %></code><% if run.dataset %> on <%= link_to run.dataset.name, dataset_path(run.dataset), class: "ck-link" %><% end %></p>
       <% end %>
     </div>
     <%= render "completion_kit/runs/actions", run: run %>

data/lib/completion_kit/version.rb CHANGED Viewed

@@ -1,3 +1,3 @@
 module CompletionKit
-  VERSION = "0.20.3"
+  VERSION = "0.20.4"
 end

metadata CHANGED Viewed

@@ -1,7 +1,7 @@
 --- !ruby/object:Gem::Specification
 name: completion-kit
 version: !ruby/object:Gem::Version
-  version: 0.20.3
+  version: 0.20.4
 platform: ruby
 authors:
 - Damien Bastin