completion-kit 0.11.0 → 0.12.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/app/assets/stylesheets/completion_kit/application.css +51 -51
- data/app/controllers/completion_kit/{calibrations_controller.rb → agreements_controller.rb} +19 -19
- data/app/controllers/completion_kit/api/v1/{calibrations_controller.rb → agreements_controller.rb} +18 -18
- data/app/controllers/completion_kit/api/v1/metric_versions_controller.rb +2 -7
- data/app/controllers/completion_kit/api/v1/metrics_controller.rb +1 -1
- data/app/controllers/completion_kit/metrics_controller.rb +10 -11
- data/app/jobs/completion_kit/judge_review_job.rb +2 -2
- data/app/models/completion_kit/{calibration.rb → agreement.rb} +1 -1
- data/app/models/completion_kit/metric_version.rb +1 -17
- data/app/models/completion_kit/review.rb +1 -0
- data/app/services/completion_kit/{calibration_math.rb → agreement_math.rb} +1 -1
- data/app/services/completion_kit/mcp_dispatcher.rb +2 -2
- data/app/services/completion_kit/mcp_tools/{calibrations.rb → agreements.rb} +11 -11
- data/app/services/completion_kit/mcp_tools/judges.rb +3 -3
- data/app/services/completion_kit/mcp_tools/metric_versions.rb +2 -7
- data/app/services/completion_kit/{metric_calibration_examples.rb → metric_agreement_examples.rb} +6 -6
- data/app/services/completion_kit/{metric_calibration_stats.rb → metric_agreement_stats.rb} +6 -6
- data/app/services/completion_kit/metric_improvement_validator.rb +1 -1
- data/app/services/completion_kit/metric_variant_generator.rb +2 -2
- data/app/views/completion_kit/{calibrations → agreements}/_buttons.html.erb +33 -33
- data/app/views/completion_kit/{calibrations → agreements}/_trust_panel.html.erb +5 -5
- data/app/views/completion_kit/api_reference/_body.html.erb +15 -15
- data/app/views/completion_kit/metrics/_guiding_examples.html.erb +1 -1
- data/app/views/completion_kit/metrics/edit.html.erb +1 -1
- data/app/views/completion_kit/metrics/show.html.erb +6 -6
- data/app/views/completion_kit/responses/show.html.erb +4 -4
- data/app/views/completion_kit/runs/show.html.erb +1 -1
- data/config/routes.rb +3 -3
- data/db/migrate/20260531000002_backfill_review_metric_versions.rb +33 -0
- data/db/migrate/20260531000003_add_metric_version_fk_to_reviews.rb +6 -0
- data/db/migrate/20260531000004_rename_calibrations_to_agreements.rb +19 -0
- data/lib/completion_kit/version.rb +1 -1
- data/lib/completion_kit.rb +2 -2
- metadata +13 -10
|
@@ -0,0 +1,19 @@
|
|
|
1
|
+
class RenameCalibrationsToAgreements < ActiveRecord::Migration[8.1]
|
|
2
|
+
CALIBRATION_INDEXES = {
|
|
3
|
+
"index_ck_calibrations_on_metric_id" => "index_ck_agreements_on_metric_id",
|
|
4
|
+
"index_ck_calibrations_on_metric_version_id" => "index_ck_agreements_on_metric_version_id",
|
|
5
|
+
"index_ck_calibrations_on_response_id" => "index_ck_agreements_on_response_id",
|
|
6
|
+
"index_ck_calibrations_on_run_id" => "index_ck_agreements_on_run_id",
|
|
7
|
+
"index_ck_calibrations_on_response_metric_user" => "index_ck_agreements_on_response_metric_user"
|
|
8
|
+
}.freeze
|
|
9
|
+
|
|
10
|
+
def up
|
|
11
|
+
rename_table :completion_kit_calibrations, :completion_kit_agreements
|
|
12
|
+
CALIBRATION_INDEXES.each { |old_name, new_name| rename_index :completion_kit_agreements, old_name, new_name }
|
|
13
|
+
end
|
|
14
|
+
|
|
15
|
+
def down
|
|
16
|
+
CALIBRATION_INDEXES.each { |old_name, new_name| rename_index :completion_kit_agreements, new_name, old_name }
|
|
17
|
+
rename_table :completion_kit_agreements, :completion_kit_calibrations
|
|
18
|
+
end
|
|
19
|
+
end
|
data/lib/completion_kit.rb
CHANGED
|
@@ -12,7 +12,7 @@ module CompletionKit
|
|
|
12
12
|
attr_accessor :api_reference_authentication_partial
|
|
13
13
|
attr_accessor :api_rate_limit, :web_rate_limit
|
|
14
14
|
attr_accessor :allow_loopback_endpoints
|
|
15
|
-
attr_accessor :judge_calibration_enabled
|
|
15
|
+
attr_accessor :judge_agreement_enabled
|
|
16
16
|
attr_accessor :judge_examples_from_reviews
|
|
17
17
|
|
|
18
18
|
def initialize
|
|
@@ -29,7 +29,7 @@ module CompletionKit
|
|
|
29
29
|
@web_rate_limit = 300
|
|
30
30
|
|
|
31
31
|
@allow_loopback_endpoints = true
|
|
32
|
-
@
|
|
32
|
+
@judge_agreement_enabled = true
|
|
33
33
|
@judge_examples_from_reviews = false
|
|
34
34
|
|
|
35
35
|
@api_reference_authentication_partial = "completion_kit/api_reference/authentication"
|
metadata
CHANGED
|
@@ -1,7 +1,7 @@
|
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
|
2
2
|
name: completion-kit
|
|
3
3
|
version: !ruby/object:Gem::Version
|
|
4
|
-
version: 0.11.0
|
|
4
|
+
version: 0.12.0
|
|
5
5
|
platform: ruby
|
|
6
6
|
authors:
|
|
7
7
|
- Damien Bastin
|
|
@@ -234,8 +234,9 @@ files:
|
|
|
234
234
|
- app/assets/images/completion_kit/logo.png
|
|
235
235
|
- app/assets/javascripts/completion_kit/application.js
|
|
236
236
|
- app/assets/stylesheets/completion_kit/application.css
|
|
237
|
+
- app/controllers/completion_kit/agreements_controller.rb
|
|
238
|
+
- app/controllers/completion_kit/api/v1/agreements_controller.rb
|
|
237
239
|
- app/controllers/completion_kit/api/v1/base_controller.rb
|
|
238
|
-
- app/controllers/completion_kit/api/v1/calibrations_controller.rb
|
|
239
240
|
- app/controllers/completion_kit/api/v1/datasets_controller.rb
|
|
240
241
|
- app/controllers/completion_kit/api/v1/metric_groups_controller.rb
|
|
241
242
|
- app/controllers/completion_kit/api/v1/metric_versions_controller.rb
|
|
@@ -247,7 +248,6 @@ files:
|
|
|
247
248
|
- app/controllers/completion_kit/api/v1/tags_controller.rb
|
|
248
249
|
- app/controllers/completion_kit/api_reference_controller.rb
|
|
249
250
|
- app/controllers/completion_kit/application_controller.rb
|
|
250
|
-
- app/controllers/completion_kit/calibrations_controller.rb
|
|
251
251
|
- app/controllers/completion_kit/dashboard_controller.rb
|
|
252
252
|
- app/controllers/completion_kit/dashboard_dismissals_controller.rb
|
|
253
253
|
- app/controllers/completion_kit/datasets_controller.rb
|
|
@@ -270,8 +270,8 @@ files:
|
|
|
270
270
|
- app/jobs/completion_kit/model_discovery_job.rb
|
|
271
271
|
- app/jobs/completion_kit/run_completion_check_job.rb
|
|
272
272
|
- app/mailers/completion_kit/application_mailer.rb
|
|
273
|
+
- app/models/completion_kit/agreement.rb
|
|
273
274
|
- app/models/completion_kit/application_record.rb
|
|
274
|
-
- app/models/completion_kit/calibration.rb
|
|
275
275
|
- app/models/completion_kit/dashboard_dismissal.rb
|
|
276
276
|
- app/models/completion_kit/dataset.rb
|
|
277
277
|
- app/models/completion_kit/mcp_session.rb
|
|
@@ -292,16 +292,16 @@ files:
|
|
|
292
292
|
- app/models/completion_kit/tagging.rb
|
|
293
293
|
- app/models/concerns/completion_kit/has_job_status.rb
|
|
294
294
|
- app/models/concerns/completion_kit/taggable.rb
|
|
295
|
+
- app/services/completion_kit/agreement_math.rb
|
|
295
296
|
- app/services/completion_kit/anthropic_client.rb
|
|
296
297
|
- app/services/completion_kit/api_config.rb
|
|
297
|
-
- app/services/completion_kit/calibration_math.rb
|
|
298
298
|
- app/services/completion_kit/csv_processor.rb
|
|
299
299
|
- app/services/completion_kit/dashboard_stats.rb
|
|
300
300
|
- app/services/completion_kit/judge_service.rb
|
|
301
301
|
- app/services/completion_kit/llm_client.rb
|
|
302
302
|
- app/services/completion_kit/mcp_dispatcher.rb
|
|
303
|
+
- app/services/completion_kit/mcp_tools/agreements.rb
|
|
303
304
|
- app/services/completion_kit/mcp_tools/base.rb
|
|
304
|
-
- app/services/completion_kit/mcp_tools/calibrations.rb
|
|
305
305
|
- app/services/completion_kit/mcp_tools/datasets.rb
|
|
306
306
|
- app/services/completion_kit/mcp_tools/judges.rb
|
|
307
307
|
- app/services/completion_kit/mcp_tools/metric_groups.rb
|
|
@@ -312,8 +312,8 @@ files:
|
|
|
312
312
|
- app/services/completion_kit/mcp_tools/responses.rb
|
|
313
313
|
- app/services/completion_kit/mcp_tools/runs.rb
|
|
314
314
|
- app/services/completion_kit/mcp_tools/tags.rb
|
|
315
|
-
- app/services/completion_kit/metric_calibration_examples.rb
|
|
316
|
-
- app/services/completion_kit/metric_calibration_stats.rb
|
|
315
|
+
- app/services/completion_kit/metric_agreement_examples.rb
|
|
316
|
+
- app/services/completion_kit/metric_agreement_stats.rb
|
|
317
317
|
- app/services/completion_kit/metric_improvement_validator.rb
|
|
318
318
|
- app/services/completion_kit/metric_variant_generator.rb
|
|
319
319
|
- app/services/completion_kit/model_discovery_service.rb
|
|
@@ -328,14 +328,14 @@ files:
|
|
|
328
328
|
- app/services/completion_kit/starter_metrics.rb
|
|
329
329
|
- app/services/completion_kit/worker_health.rb
|
|
330
330
|
- app/validators/completion_kit/tenant_scoped_uniqueness_validator.rb
|
|
331
|
+
- app/views/completion_kit/agreements/_buttons.html.erb
|
|
332
|
+
- app/views/completion_kit/agreements/_trust_panel.html.erb
|
|
331
333
|
- app/views/completion_kit/api_reference/_authentication.html.erb
|
|
332
334
|
- app/views/completion_kit/api_reference/_body.html.erb
|
|
333
335
|
- app/views/completion_kit/api_reference/_example.html.erb
|
|
334
336
|
- app/views/completion_kit/api_reference/_resource_card.html.erb
|
|
335
337
|
- app/views/completion_kit/api_reference/_resource_list.html.erb
|
|
336
338
|
- app/views/completion_kit/api_reference/index.html.erb
|
|
337
|
-
- app/views/completion_kit/calibrations/_buttons.html.erb
|
|
338
|
-
- app/views/completion_kit/calibrations/_trust_panel.html.erb
|
|
339
339
|
- app/views/completion_kit/dashboard/_eye_icon.html.erb
|
|
340
340
|
- app/views/completion_kit/dashboard/_eye_off_icon.html.erb
|
|
341
341
|
- app/views/completion_kit/dashboard/_failures_card.html.erb
|
|
@@ -440,6 +440,9 @@ files:
|
|
|
440
440
|
- db/migrate/20260529000001_remove_few_shot_examples_from_completion_kit_metrics.rb
|
|
441
441
|
- db/migrate/20260530000001_add_excluded_from_examples_to_completion_kit_calibrations.rb
|
|
442
442
|
- db/migrate/20260531000001_add_validation_summary_to_completion_kit_metric_versions.rb
|
|
443
|
+
- db/migrate/20260531000002_backfill_review_metric_versions.rb
|
|
444
|
+
- db/migrate/20260531000003_add_metric_version_fk_to_reviews.rb
|
|
445
|
+
- db/migrate/20260531000004_rename_calibrations_to_agreements.rb
|
|
443
446
|
- lib/completion-kit.rb
|
|
444
447
|
- lib/completion_kit.rb
|
|
445
448
|
- lib/completion_kit/concurrency_check.rb
|