langwatch-scenario 0.7.13__py3-none-any.whl → 0.7.14__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {langwatch_scenario-0.7.13.dist-info → langwatch_scenario-0.7.14.dist-info}/METADATA +1 -1
- {langwatch_scenario-0.7.13.dist-info → langwatch_scenario-0.7.14.dist-info}/RECORD +6 -6
- scenario/judge_agent.py +4 -3
- {langwatch_scenario-0.7.13.dist-info → langwatch_scenario-0.7.14.dist-info}/WHEEL +0 -0
- {langwatch_scenario-0.7.13.dist-info → langwatch_scenario-0.7.14.dist-info}/entry_points.txt +0 -0
- {langwatch_scenario-0.7.13.dist-info → langwatch_scenario-0.7.14.dist-info}/top_level.txt +0 -0
@@ -2,7 +2,7 @@ scenario/__init__.py,sha256=4WO8TjY8Lc0NhYL7b9LvaB1xCBqwUkLuI0uIA6PQP6c,4223
|
|
2
2
|
scenario/_error_messages.py,sha256=QVFSbhzsVNGz2GOBOaoQFW6w6AOyZCWLTt0ySWPfnGw,3882
|
3
3
|
scenario/agent_adapter.py,sha256=PoY2KQqYuqzIIb3-nhIU-MPXwHJc1vmwdweMy7ut-hk,4255
|
4
4
|
scenario/cache.py,sha256=J6s6Sia_Ce6TrnsInlhfxm6SF8tygo3sH-_cQCRX1WA,6213
|
5
|
-
scenario/judge_agent.py,sha256=
|
5
|
+
scenario/judge_agent.py,sha256=RxXYpImLsr6FpFivSRB26vWSnQFJlAd6ocWdyL6EAYM,17752
|
6
6
|
scenario/py.typed,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
7
7
|
scenario/pytest_plugin.py,sha256=wRCuGD9uwrrLt2fY15zK6mnmY9W_dO_m0WalPJYE5II,11491
|
8
8
|
scenario/scenario_executor.py,sha256=v41UgSHebosXf95FfYIeVUm6s4IbMP_U58FdGoZ_kZU,35653
|
@@ -235,8 +235,8 @@ scenario/config/__init__.py,sha256=b2X_bqkIrd7jZY9dRrXk2wOqoPe87Nl_SRGuZhlolxA,1
|
|
235
235
|
scenario/config/langwatch.py,sha256=ijWchFbUsLbQooAZmwyTw4rxfRLQseZ1GoVSiPPbzpw,1677
|
236
236
|
scenario/config/model.py,sha256=VQtPkG-O1gVjtMIKbMOrbcnySv8pqODokC_VOaKVS4g,2054
|
237
237
|
scenario/config/scenario.py,sha256=tUnzFBtuhPimU4EyaXm9T6KlpfntGtQaH5teW2F9oGk,5426
|
238
|
-
langwatch_scenario-0.7.
|
239
|
-
langwatch_scenario-0.7.
|
240
|
-
langwatch_scenario-0.7.
|
241
|
-
langwatch_scenario-0.7.
|
242
|
-
langwatch_scenario-0.7.
|
238
|
+
langwatch_scenario-0.7.14.dist-info/METADATA,sha256=B9rniakNtewXOAzmgYi4AbfMRRRS1_GqtXKZiSRtNYQ,20065
|
239
|
+
langwatch_scenario-0.7.14.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
|
240
|
+
langwatch_scenario-0.7.14.dist-info/entry_points.txt,sha256=WlEnJ_gku0i18bIa3DSuGqXRX-QDQLe_s0YmRzK45TI,45
|
241
|
+
langwatch_scenario-0.7.14.dist-info/top_level.txt,sha256=45Mn28aedJsetnBMB5xSmrJ-yo701QLH89Zlz4r1clE,9
|
242
|
+
langwatch_scenario-0.7.14.dist-info/RECORD,,
|
scenario/judge_agent.py
CHANGED
@@ -339,7 +339,8 @@ if you don't have enough information to make a verdict, say inconclusive with ma
|
|
339
339
|
"type": "object",
|
340
340
|
"properties": {
|
341
341
|
criteria_names[idx]: {
|
342
|
-
"
|
342
|
+
"type": "string",
|
343
|
+
"enum": ["true", "false", "inconclusive"],
|
343
344
|
"description": criterion,
|
344
345
|
}
|
345
346
|
for idx, criterion in enumerate(self.criteria)
|
@@ -415,12 +416,12 @@ if you don't have enough information to make a verdict, say inconclusive with ma
|
|
415
416
|
passed_criteria = [
|
416
417
|
self.criteria[idx]
|
417
418
|
for idx, criterion in enumerate(criteria.values())
|
418
|
-
if criterion ==
|
419
|
+
if criterion == "true"
|
419
420
|
]
|
420
421
|
failed_criteria = [
|
421
422
|
self.criteria[idx]
|
422
423
|
for idx, criterion in enumerate(criteria.values())
|
423
|
-
if criterion ==
|
424
|
+
if criterion == "false" or criterion == "inconclusive"
|
424
425
|
]
|
425
426
|
|
426
427
|
# Return the appropriate ScenarioResult based on the verdict
|
File without changes
|
{langwatch_scenario-0.7.13.dist-info → langwatch_scenario-0.7.14.dist-info}/entry_points.txt
RENAMED
File without changes
|
File without changes
|