scorebook-0.0.8-py3-none-any.whl → scorebook-0.0.9-py3-none-any.whl

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.
scorebook/evaluate.py CHANGED
@@ -430,14 +430,14 @@ def _build_eval_run_specs(
430
430
  )
431
431
 
432
432
  # Create adaptive eval run spec from string
433
- elif isinstance(dataset, str) and dataset.endswith(":adaptive"):
433
+ elif isinstance(dataset, AdaptiveEvalDataset):
434
434
  if not experiment_id or not project_id:
435
435
  raise ScoreBookError(
436
436
  "experiment_id and project_id are required for adaptive evaluations"
437
437
  )
438
438
  eval_run_specs.append(
439
439
  _build_adaptive_eval_run_spec(
440
- dataset,
440
+ dataset.name,
441
441
  dataset_index,
442
442
  hyperparameter_config,
443
443
  hyperparameters_index,
@@ -38,7 +38,7 @@ async def run_adaptive_evaluation(
38
38
  runner = AdaptiveTest(
39
39
  make_trismik_inference(inference),
40
40
  client=TrismikAsyncClient(
41
- service_url="https://api-stage.trismik.com/adaptive-testing", api_key=get_token()
41
+ service_url="https://api.trismik.com/adaptive-testing", api_key=get_token()
42
42
  ),
43
43
  )
44
44
 
@@ -40,7 +40,7 @@ async def upload_classic_eval_run(
40
40
  runner = AdaptiveTest(
41
41
  lambda x: None,
42
42
  client=TrismikAsyncClient(
43
- service_url="https://api-stage.trismik.com/adaptive-testing", api_key=get_token()
43
+ service_url="https://api.trismik.com/adaptive-testing", api_key=get_token()
44
44
  ),
45
45
  )
46
46
 
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: scorebook
3
- Version: 0.0.8
3
+ Version: 0.0.9
4
4
  Summary: A Python project for LLM evaluation.
5
5
  License-File: LICENSE
6
6
  Author: Euan Campbell
@@ -3,7 +3,7 @@ scorebook/cli/__init__.py,sha256=E89jR1DljFSHhfjEGSRKLgz0KhxGyRQ9a3vpUOmQL9o,32
3
3
  scorebook/cli/auth.py,sha256=bv3imsgmY_t52wFoMJt9iu-cKPwvKYkVqZ7nE8EVc6E,2931
4
4
  scorebook/cli/main.py,sha256=cEvShENl6L6feX_sa7FGNTeoz5UtwqzwenmcHaON1hg,1589
5
5
  scorebook/eval_dataset.py,sha256=LSTyxUkT06iEAVYCnjIDFxFgZzRejwiS5CZA-jvy1ns,15098
6
- scorebook/evaluate.py,sha256=7tj1qFogcQJtCTAKK3oFnjV1xCMpxaHVnK0EGa9M4Hg,21912
6
+ scorebook/evaluate.py,sha256=OOBTZmx84ZAuZKbIe1pp9L3201cX2gjPAkw_llYNnfE,21899
7
7
  scorebook/exceptions.py,sha256=emq2QY-4mW6VXlq1dxunPjt-xZpLQIxo8Ck_gYxz1VE,1827
8
8
  scorebook/inference/__init__.py,sha256=tqSXSyVurc_YRfPypYed8iTH7Fwt7iFCXMxBXnqY-9I,242
9
9
  scorebook/inference/bedrock.py,sha256=wllq0ysNFQKWJDEqoN-k96Jx43BHCAvfxm14zMRCf90,10074
@@ -17,9 +17,9 @@ scorebook/metrics/metric_base.py,sha256=I3L0DGcRojFp93UGFnXG1tZ2UK9ilTcXXJG6lj5d
17
17
  scorebook/metrics/metric_registry.py,sha256=jWwt9P3zvtFLlEYrd60v7LS7X251nZczouE02zcCxWg,3402
18
18
  scorebook/metrics/precision.py,sha256=AaYPYYKnY74Nwqp_p3jd2Ewf3VHNOJjoRWf5fhb-tXk,563
19
19
  scorebook/trismik_services/__init__.py,sha256=CiGl1u4GcfYhWmB_fGOlsJPwYeKXtIr-uCXoOv4O8yg,284
20
- scorebook/trismik_services/adaptive_testing_service.py,sha256=S1yAVnrzqtVWprsiNS_l3q5FibQkMuAs7I7YaSFNtKM,5109
20
+ scorebook/trismik_services/adaptive_testing_service.py,sha256=4FVW8g7EvJmHYpQp68y0U3xzOw_qJ9nkhEPiMnzTb4s,5103
21
21
  scorebook/trismik_services/login.py,sha256=WtJLaNmBMwCi6gT1Bgp4J9x2tq5HDrDI9U074r08TnU,3275
22
- scorebook/trismik_services/upload_classic_eval_run.py,sha256=oHxELymEPxikVbtC6EQ06LfuNKEFV4Ijnth5v78bAmQ,3664
22
+ scorebook/trismik_services/upload_classic_eval_run.py,sha256=t6tvaKfP2lFBKmZ_bM6oe_mUOjA_UKu35GbgL26QW3A,3658
23
23
  scorebook/types.py,sha256=zt8sGfbRjXatx1WtttWZDVIoiS-yhh_1lP0K4VHYvAM,5797
24
24
  scorebook/utils/__init__.py,sha256=l_bfi9lAMz1oyGnuyKuzYasQKt2DJwffqsbfSl4-GIQ,452
25
25
  scorebook/utils/async_utils.py,sha256=OeNvMrOT9P4rIyaCf5IbR3ZIFMtEzXgoAArNbINRtMU,728
@@ -29,8 +29,8 @@ scorebook/utils/jinja_helpers.py,sha256=ksIKHiKdj8N0o7ZJZGasfbSNoAY6K5d9X_KM6mcK
29
29
  scorebook/utils/mappers.py,sha256=OcUnPBrnSUxZNhAzJhVmVWUWmqIKFXLTrK-xLi6_SUg,1259
30
30
  scorebook/utils/progress_bars.py,sha256=TBz41w3yFujsO9n8vUjeubgOrmdiAMI2P2SSVqTJzAA,5269
31
31
  scorebook/utils/transform_helpers.py,sha256=UnVLtFvcJrtmBEmLsuA4rrX4iJlNUKxm2DkIOGLl-2o,1030
32
- scorebook-0.0.8.dist-info/METADATA,sha256=ozjSfRd5jd9VIiOmjdSWmGsu0l5aaN5qQe-7Ty7ps5U,11516
33
- scorebook-0.0.8.dist-info/WHEEL,sha256=zp0Cn7JsFoX2ATtOhtaFYIiE2rmFAD4OcMhtUki8W3U,88
34
- scorebook-0.0.8.dist-info/entry_points.txt,sha256=9gNd3Q0MEozhJ7fog-Q-Z_PrcGMnF-404Jon40MH2_U,53
35
- scorebook-0.0.8.dist-info/licenses/LICENSE,sha256=JLH1g9FhxHZf6CBCeQ_xAisPtICVObuNGW1bLPiTYEs,1068
36
- scorebook-0.0.8.dist-info/RECORD,,
32
+ scorebook-0.0.9.dist-info/METADATA,sha256=-VyogmnwuCfPBaj6BS_gOGKxgAkxcnAx6k2GFaI1jGg,11516
33
+ scorebook-0.0.9.dist-info/WHEEL,sha256=zp0Cn7JsFoX2ATtOhtaFYIiE2rmFAD4OcMhtUki8W3U,88
34
+ scorebook-0.0.9.dist-info/entry_points.txt,sha256=9gNd3Q0MEozhJ7fog-Q-Z_PrcGMnF-404Jon40MH2_U,53
35
+ scorebook-0.0.9.dist-info/licenses/LICENSE,sha256=JLH1g9FhxHZf6CBCeQ_xAisPtICVObuNGW1bLPiTYEs,1068
36
+ scorebook-0.0.9.dist-info/RECORD,,