completion-kit 0.11.0 → 0.12.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (35)
  1. checksums.yaml +4 -4
  2. data/app/assets/stylesheets/completion_kit/application.css +51 -51
  3. data/app/controllers/completion_kit/{calibrations_controller.rb → agreements_controller.rb} +19 -19
  4. data/app/controllers/completion_kit/api/v1/{calibrations_controller.rb → agreements_controller.rb} +18 -18
  5. data/app/controllers/completion_kit/api/v1/metric_versions_controller.rb +2 -7
  6. data/app/controllers/completion_kit/api/v1/metrics_controller.rb +1 -1
  7. data/app/controllers/completion_kit/metrics_controller.rb +10 -11
  8. data/app/jobs/completion_kit/judge_review_job.rb +2 -2
  9. data/app/models/completion_kit/{calibration.rb → agreement.rb} +1 -1
  10. data/app/models/completion_kit/metric_version.rb +1 -17
  11. data/app/models/completion_kit/review.rb +1 -0
  12. data/app/services/completion_kit/{calibration_math.rb → agreement_math.rb} +1 -1
  13. data/app/services/completion_kit/mcp_dispatcher.rb +2 -2
  14. data/app/services/completion_kit/mcp_tools/{calibrations.rb → agreements.rb} +11 -11
  15. data/app/services/completion_kit/mcp_tools/judges.rb +3 -3
  16. data/app/services/completion_kit/mcp_tools/metric_versions.rb +2 -7
  17. data/app/services/completion_kit/{metric_calibration_examples.rb → metric_agreement_examples.rb} +6 -6
  18. data/app/services/completion_kit/{metric_calibration_stats.rb → metric_agreement_stats.rb} +6 -6
  19. data/app/services/completion_kit/metric_improvement_validator.rb +1 -1
  20. data/app/services/completion_kit/metric_variant_generator.rb +2 -2
  21. data/app/views/completion_kit/{calibrations → agreements}/_buttons.html.erb +33 -33
  22. data/app/views/completion_kit/{calibrations → agreements}/_trust_panel.html.erb +5 -5
  23. data/app/views/completion_kit/api_reference/_body.html.erb +15 -15
  24. data/app/views/completion_kit/metrics/_guiding_examples.html.erb +1 -1
  25. data/app/views/completion_kit/metrics/edit.html.erb +1 -1
  26. data/app/views/completion_kit/metrics/show.html.erb +6 -6
  27. data/app/views/completion_kit/responses/show.html.erb +4 -4
  28. data/app/views/completion_kit/runs/show.html.erb +1 -1
  29. data/config/routes.rb +3 -3
  30. data/db/migrate/20260531000002_backfill_review_metric_versions.rb +33 -0
  31. data/db/migrate/20260531000003_add_metric_version_fk_to_reviews.rb +6 -0
  32. data/db/migrate/20260531000004_rename_calibrations_to_agreements.rb +19 -0
  33. data/lib/completion_kit/version.rb +1 -1
  34. data/lib/completion_kit.rb +2 -2
  35. metadata +13 -10
@@ -0,0 +1,19 @@
1
+ class RenameCalibrationsToAgreements < ActiveRecord::Migration[8.1]
2
+ CALIBRATION_INDEXES = {
3
+ "index_ck_calibrations_on_metric_id" => "index_ck_agreements_on_metric_id",
4
+ "index_ck_calibrations_on_metric_version_id" => "index_ck_agreements_on_metric_version_id",
5
+ "index_ck_calibrations_on_response_id" => "index_ck_agreements_on_response_id",
6
+ "index_ck_calibrations_on_run_id" => "index_ck_agreements_on_run_id",
7
+ "index_ck_calibrations_on_response_metric_user" => "index_ck_agreements_on_response_metric_user"
8
+ }.freeze
9
+
10
+ def up
11
+ rename_table :completion_kit_calibrations, :completion_kit_agreements
12
+ CALIBRATION_INDEXES.each { |old_name, new_name| rename_index :completion_kit_agreements, old_name, new_name }
13
+ end
14
+
15
+ def down
16
+ CALIBRATION_INDEXES.each { |old_name, new_name| rename_index :completion_kit_agreements, new_name, old_name }
17
+ rename_table :completion_kit_agreements, :completion_kit_calibrations
18
+ end
19
+ end
@@ -1,3 +1,3 @@
1
1
  module CompletionKit
2
- VERSION = "0.11.0"
2
+ VERSION = "0.12.0"
3
3
  end
@@ -12,7 +12,7 @@ module CompletionKit
12
12
  attr_accessor :api_reference_authentication_partial
13
13
  attr_accessor :api_rate_limit, :web_rate_limit
14
14
  attr_accessor :allow_loopback_endpoints
15
- attr_accessor :judge_calibration_enabled
15
+ attr_accessor :judge_agreement_enabled
16
16
  attr_accessor :judge_examples_from_reviews
17
17
 
18
18
  def initialize
@@ -29,7 +29,7 @@ module CompletionKit
29
29
  @web_rate_limit = 300
30
30
 
31
31
  @allow_loopback_endpoints = true
32
- @judge_calibration_enabled = true
32
+ @judge_agreement_enabled = true
33
33
  @judge_examples_from_reviews = false
34
34
 
35
35
  @api_reference_authentication_partial = "completion_kit/api_reference/authentication"
metadata CHANGED
@@ -1,7 +1,7 @@
1
1
  --- !ruby/object:Gem::Specification
2
2
  name: completion-kit
3
3
  version: !ruby/object:Gem::Version
4
- version: 0.11.0
4
+ version: 0.12.0
5
5
  platform: ruby
6
6
  authors:
7
7
  - Damien Bastin
@@ -234,8 +234,9 @@ files:
234
234
  - app/assets/images/completion_kit/logo.png
235
235
  - app/assets/javascripts/completion_kit/application.js
236
236
  - app/assets/stylesheets/completion_kit/application.css
237
+ - app/controllers/completion_kit/agreements_controller.rb
238
+ - app/controllers/completion_kit/api/v1/agreements_controller.rb
237
239
  - app/controllers/completion_kit/api/v1/base_controller.rb
238
- - app/controllers/completion_kit/api/v1/calibrations_controller.rb
239
240
  - app/controllers/completion_kit/api/v1/datasets_controller.rb
240
241
  - app/controllers/completion_kit/api/v1/metric_groups_controller.rb
241
242
  - app/controllers/completion_kit/api/v1/metric_versions_controller.rb
@@ -247,7 +248,6 @@ files:
247
248
  - app/controllers/completion_kit/api/v1/tags_controller.rb
248
249
  - app/controllers/completion_kit/api_reference_controller.rb
249
250
  - app/controllers/completion_kit/application_controller.rb
250
- - app/controllers/completion_kit/calibrations_controller.rb
251
251
  - app/controllers/completion_kit/dashboard_controller.rb
252
252
  - app/controllers/completion_kit/dashboard_dismissals_controller.rb
253
253
  - app/controllers/completion_kit/datasets_controller.rb
@@ -270,8 +270,8 @@ files:
270
270
  - app/jobs/completion_kit/model_discovery_job.rb
271
271
  - app/jobs/completion_kit/run_completion_check_job.rb
272
272
  - app/mailers/completion_kit/application_mailer.rb
273
+ - app/models/completion_kit/agreement.rb
273
274
  - app/models/completion_kit/application_record.rb
274
- - app/models/completion_kit/calibration.rb
275
275
  - app/models/completion_kit/dashboard_dismissal.rb
276
276
  - app/models/completion_kit/dataset.rb
277
277
  - app/models/completion_kit/mcp_session.rb
@@ -292,16 +292,16 @@ files:
292
292
  - app/models/completion_kit/tagging.rb
293
293
  - app/models/concerns/completion_kit/has_job_status.rb
294
294
  - app/models/concerns/completion_kit/taggable.rb
295
+ - app/services/completion_kit/agreement_math.rb
295
296
  - app/services/completion_kit/anthropic_client.rb
296
297
  - app/services/completion_kit/api_config.rb
297
- - app/services/completion_kit/calibration_math.rb
298
298
  - app/services/completion_kit/csv_processor.rb
299
299
  - app/services/completion_kit/dashboard_stats.rb
300
300
  - app/services/completion_kit/judge_service.rb
301
301
  - app/services/completion_kit/llm_client.rb
302
302
  - app/services/completion_kit/mcp_dispatcher.rb
303
+ - app/services/completion_kit/mcp_tools/agreements.rb
303
304
  - app/services/completion_kit/mcp_tools/base.rb
304
- - app/services/completion_kit/mcp_tools/calibrations.rb
305
305
  - app/services/completion_kit/mcp_tools/datasets.rb
306
306
  - app/services/completion_kit/mcp_tools/judges.rb
307
307
  - app/services/completion_kit/mcp_tools/metric_groups.rb
@@ -312,8 +312,8 @@ files:
312
312
  - app/services/completion_kit/mcp_tools/responses.rb
313
313
  - app/services/completion_kit/mcp_tools/runs.rb
314
314
  - app/services/completion_kit/mcp_tools/tags.rb
315
- - app/services/completion_kit/metric_calibration_examples.rb
316
- - app/services/completion_kit/metric_calibration_stats.rb
315
+ - app/services/completion_kit/metric_agreement_examples.rb
316
+ - app/services/completion_kit/metric_agreement_stats.rb
317
317
  - app/services/completion_kit/metric_improvement_validator.rb
318
318
  - app/services/completion_kit/metric_variant_generator.rb
319
319
  - app/services/completion_kit/model_discovery_service.rb
@@ -328,14 +328,14 @@ files:
328
328
  - app/services/completion_kit/starter_metrics.rb
329
329
  - app/services/completion_kit/worker_health.rb
330
330
  - app/validators/completion_kit/tenant_scoped_uniqueness_validator.rb
331
+ - app/views/completion_kit/agreements/_buttons.html.erb
332
+ - app/views/completion_kit/agreements/_trust_panel.html.erb
331
333
  - app/views/completion_kit/api_reference/_authentication.html.erb
332
334
  - app/views/completion_kit/api_reference/_body.html.erb
333
335
  - app/views/completion_kit/api_reference/_example.html.erb
334
336
  - app/views/completion_kit/api_reference/_resource_card.html.erb
335
337
  - app/views/completion_kit/api_reference/_resource_list.html.erb
336
338
  - app/views/completion_kit/api_reference/index.html.erb
337
- - app/views/completion_kit/calibrations/_buttons.html.erb
338
- - app/views/completion_kit/calibrations/_trust_panel.html.erb
339
339
  - app/views/completion_kit/dashboard/_eye_icon.html.erb
340
340
  - app/views/completion_kit/dashboard/_eye_off_icon.html.erb
341
341
  - app/views/completion_kit/dashboard/_failures_card.html.erb
@@ -440,6 +440,9 @@ files:
440
440
  - db/migrate/20260529000001_remove_few_shot_examples_from_completion_kit_metrics.rb
441
441
  - db/migrate/20260530000001_add_excluded_from_examples_to_completion_kit_calibrations.rb
442
442
  - db/migrate/20260531000001_add_validation_summary_to_completion_kit_metric_versions.rb
443
+ - db/migrate/20260531000002_backfill_review_metric_versions.rb
444
+ - db/migrate/20260531000003_add_metric_version_fk_to_reviews.rb
445
+ - db/migrate/20260531000004_rename_calibrations_to_agreements.rb
443
446
  - lib/completion-kit.rb
444
447
  - lib/completion_kit.rb
445
448
  - lib/completion_kit/concurrency_check.rb