langwatch-scenario 0.7.13__py3-none-any.whl → 0.7.14__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: langwatch-scenario
3
- Version: 0.7.13
3
+ Version: 0.7.14
4
4
  Summary: The end-to-end agent testing library
5
5
  Author-email: LangWatch Team <support@langwatch.ai>
6
6
  License: MIT
@@ -2,7 +2,7 @@ scenario/__init__.py,sha256=4WO8TjY8Lc0NhYL7b9LvaB1xCBqwUkLuI0uIA6PQP6c,4223
2
2
  scenario/_error_messages.py,sha256=QVFSbhzsVNGz2GOBOaoQFW6w6AOyZCWLTt0ySWPfnGw,3882
3
3
  scenario/agent_adapter.py,sha256=PoY2KQqYuqzIIb3-nhIU-MPXwHJc1vmwdweMy7ut-hk,4255
4
4
  scenario/cache.py,sha256=J6s6Sia_Ce6TrnsInlhfxm6SF8tygo3sH-_cQCRX1WA,6213
5
- scenario/judge_agent.py,sha256=xIZaS7t7lWLLEj7UKYRpqKtxXtu7vO3ePN90lW8wbFQ,17686
5
+ scenario/judge_agent.py,sha256=RxXYpImLsr6FpFivSRB26vWSnQFJlAd6ocWdyL6EAYM,17752
6
6
  scenario/py.typed,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
7
7
  scenario/pytest_plugin.py,sha256=wRCuGD9uwrrLt2fY15zK6mnmY9W_dO_m0WalPJYE5II,11491
8
8
  scenario/scenario_executor.py,sha256=v41UgSHebosXf95FfYIeVUm6s4IbMP_U58FdGoZ_kZU,35653
@@ -235,8 +235,8 @@ scenario/config/__init__.py,sha256=b2X_bqkIrd7jZY9dRrXk2wOqoPe87Nl_SRGuZhlolxA,1
235
235
  scenario/config/langwatch.py,sha256=ijWchFbUsLbQooAZmwyTw4rxfRLQseZ1GoVSiPPbzpw,1677
236
236
  scenario/config/model.py,sha256=VQtPkG-O1gVjtMIKbMOrbcnySv8pqODokC_VOaKVS4g,2054
237
237
  scenario/config/scenario.py,sha256=tUnzFBtuhPimU4EyaXm9T6KlpfntGtQaH5teW2F9oGk,5426
238
- langwatch_scenario-0.7.13.dist-info/METADATA,sha256=mitJjq_Y3AjIUtMFK5gpXpOYBdG9tRU-yHqhLWE6tGM,20065
239
- langwatch_scenario-0.7.13.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
240
- langwatch_scenario-0.7.13.dist-info/entry_points.txt,sha256=WlEnJ_gku0i18bIa3DSuGqXRX-QDQLe_s0YmRzK45TI,45
241
- langwatch_scenario-0.7.13.dist-info/top_level.txt,sha256=45Mn28aedJsetnBMB5xSmrJ-yo701QLH89Zlz4r1clE,9
242
- langwatch_scenario-0.7.13.dist-info/RECORD,,
238
+ langwatch_scenario-0.7.14.dist-info/METADATA,sha256=B9rniakNtewXOAzmgYi4AbfMRRRS1_GqtXKZiSRtNYQ,20065
239
+ langwatch_scenario-0.7.14.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
240
+ langwatch_scenario-0.7.14.dist-info/entry_points.txt,sha256=WlEnJ_gku0i18bIa3DSuGqXRX-QDQLe_s0YmRzK45TI,45
241
+ langwatch_scenario-0.7.14.dist-info/top_level.txt,sha256=45Mn28aedJsetnBMB5xSmrJ-yo701QLH89Zlz4r1clE,9
242
+ langwatch_scenario-0.7.14.dist-info/RECORD,,
scenario/judge_agent.py CHANGED
@@ -339,7 +339,8 @@ if you don't have enough information to make a verdict, say inconclusive with ma
339
339
  "type": "object",
340
340
  "properties": {
341
341
  criteria_names[idx]: {
342
- "enum": [True, False, "inconclusive"],
342
+ "type": "string",
343
+ "enum": ["true", "false", "inconclusive"],
343
344
  "description": criterion,
344
345
  }
345
346
  for idx, criterion in enumerate(self.criteria)
@@ -415,12 +416,12 @@ if you don't have enough information to make a verdict, say inconclusive with ma
415
416
  passed_criteria = [
416
417
  self.criteria[idx]
417
418
  for idx, criterion in enumerate(criteria.values())
418
- if criterion == True
419
+ if criterion == "true"
419
420
  ]
420
421
  failed_criteria = [
421
422
  self.criteria[idx]
422
423
  for idx, criterion in enumerate(criteria.values())
423
- if criterion == False or criterion == "inconclusive"
424
+ if criterion == "false" or criterion == "inconclusive"
424
425
  ]
425
426
 
426
427
  # Return the appropriate ScenarioResult based on the verdict