langwatch-scenario 0.7.12__py3-none-any.whl → 0.7.14__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: langwatch-scenario
3
- Version: 0.7.12
3
+ Version: 0.7.14
4
4
  Summary: The end-to-end agent testing library
5
5
  Author-email: LangWatch Team <support@langwatch.ai>
6
6
  License: MIT
@@ -2,14 +2,14 @@ scenario/__init__.py,sha256=4WO8TjY8Lc0NhYL7b9LvaB1xCBqwUkLuI0uIA6PQP6c,4223
2
2
  scenario/_error_messages.py,sha256=QVFSbhzsVNGz2GOBOaoQFW6w6AOyZCWLTt0ySWPfnGw,3882
3
3
  scenario/agent_adapter.py,sha256=PoY2KQqYuqzIIb3-nhIU-MPXwHJc1vmwdweMy7ut-hk,4255
4
4
  scenario/cache.py,sha256=J6s6Sia_Ce6TrnsInlhfxm6SF8tygo3sH-_cQCRX1WA,6213
5
- scenario/judge_agent.py,sha256=PiOgrHHPnwvCbIzEFEFdUH4NI9waLnvNfHNZwMSpkrU,17640
5
+ scenario/judge_agent.py,sha256=RxXYpImLsr6FpFivSRB26vWSnQFJlAd6ocWdyL6EAYM,17752
6
6
  scenario/py.typed,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
7
7
  scenario/pytest_plugin.py,sha256=wRCuGD9uwrrLt2fY15zK6mnmY9W_dO_m0WalPJYE5II,11491
8
8
  scenario/scenario_executor.py,sha256=v41UgSHebosXf95FfYIeVUm6s4IbMP_U58FdGoZ_kZU,35653
9
9
  scenario/scenario_state.py,sha256=R8PhPHW3obYo3DCjBH5XDdZ6bp4uol7wCXO8K2Tz30I,7101
10
10
  scenario/script.py,sha256=A0N5pP0l4FFn1xdKc78U_wkwWhEWH3EFeU_LRDtNyEI,12241
11
11
  scenario/types.py,sha256=CRSCHUplXEXhj6EYQsncwJBzbd2128YTGlFxlk-rrG8,11193
12
- scenario/user_simulator_agent.py,sha256=nBo_i2UKX_Vn_sR1mZIJHrYewhhJfE6tAxkijxW8cmY,10499
12
+ scenario/user_simulator_agent.py,sha256=lQar3rtjOvCIEiFv9nCl4eOI3bafVTdtNVc47lVyMk4,10545
13
13
  scenario/_events/__init__.py,sha256=4cj6H9zuXzvWhT2P2JNdjWzeF1PUepTjqIDw85Vid9s,1500
14
14
  scenario/_events/event_alert_message_logger.py,sha256=4zf9DV69ZkjHdLCyj7mgXdzpMy21YZLwXaVd8EB6AwY,2995
15
15
  scenario/_events/event_bus.py,sha256=IsKNsClF1JFYj728EcxX1hw_KbfDkfJq3Y2Kv4h94n4,9871
@@ -235,8 +235,8 @@ scenario/config/__init__.py,sha256=b2X_bqkIrd7jZY9dRrXk2wOqoPe87Nl_SRGuZhlolxA,1
235
235
  scenario/config/langwatch.py,sha256=ijWchFbUsLbQooAZmwyTw4rxfRLQseZ1GoVSiPPbzpw,1677
236
236
  scenario/config/model.py,sha256=VQtPkG-O1gVjtMIKbMOrbcnySv8pqODokC_VOaKVS4g,2054
237
237
  scenario/config/scenario.py,sha256=tUnzFBtuhPimU4EyaXm9T6KlpfntGtQaH5teW2F9oGk,5426
238
- langwatch_scenario-0.7.12.dist-info/METADATA,sha256=bnDVB7CRXwJxTmW5Rhu8lZ_CoqEVB881wIK5U0LD-kI,20065
239
- langwatch_scenario-0.7.12.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
240
- langwatch_scenario-0.7.12.dist-info/entry_points.txt,sha256=WlEnJ_gku0i18bIa3DSuGqXRX-QDQLe_s0YmRzK45TI,45
241
- langwatch_scenario-0.7.12.dist-info/top_level.txt,sha256=45Mn28aedJsetnBMB5xSmrJ-yo701QLH89Zlz4r1clE,9
242
- langwatch_scenario-0.7.12.dist-info/RECORD,,
238
+ langwatch_scenario-0.7.14.dist-info/METADATA,sha256=B9rniakNtewXOAzmgYi4AbfMRRRS1_GqtXKZiSRtNYQ,20065
239
+ langwatch_scenario-0.7.14.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
240
+ langwatch_scenario-0.7.14.dist-info/entry_points.txt,sha256=WlEnJ_gku0i18bIa3DSuGqXRX-QDQLe_s0YmRzK45TI,45
241
+ langwatch_scenario-0.7.14.dist-info/top_level.txt,sha256=45Mn28aedJsetnBMB5xSmrJ-yo701QLH89Zlz4r1clE,9
242
+ langwatch_scenario-0.7.14.dist-info/RECORD,,
scenario/judge_agent.py CHANGED
@@ -181,6 +181,7 @@ class JudgeAgent(AgentAdapter):
181
181
  ScenarioConfig.default_config.default_model, str
182
182
  ):
183
183
  self.model = model or ScenarioConfig.default_config.default_model
184
+ self._extra_params = extra_params
184
185
  elif ScenarioConfig.default_config is not None and isinstance(
185
186
  ScenarioConfig.default_config.default_model, ModelConfig
186
187
  ):
@@ -338,7 +339,8 @@ if you don't have enough information to make a verdict, say inconclusive with ma
338
339
  "type": "object",
339
340
  "properties": {
340
341
  criteria_names[idx]: {
341
- "enum": [True, False, "inconclusive"],
342
+ "type": "string",
343
+ "enum": ["true", "false", "inconclusive"],
342
344
  "description": criterion,
343
345
  }
344
346
  for idx, criterion in enumerate(self.criteria)
@@ -414,12 +416,12 @@ if you don't have enough information to make a verdict, say inconclusive with ma
414
416
  passed_criteria = [
415
417
  self.criteria[idx]
416
418
  for idx, criterion in enumerate(criteria.values())
417
- if criterion == True
419
+ if criterion == "true"
418
420
  ]
419
421
  failed_criteria = [
420
422
  self.criteria[idx]
421
423
  for idx, criterion in enumerate(criteria.values())
422
- if criterion == False or criterion == "inconclusive"
424
+ if criterion == "false" or criterion == "inconclusive"
423
425
  ]
424
426
 
425
427
  # Return the appropriate ScenarioResult based on the verdict
@@ -154,6 +154,7 @@ class UserSimulatorAgent(AgentAdapter):
154
154
  ScenarioConfig.default_config.default_model, str
155
155
  ):
156
156
  self.model = model or ScenarioConfig.default_config.default_model
157
+ self._extra_params = extra_params
157
158
  elif ScenarioConfig.default_config is not None and isinstance(
158
159
  ScenarioConfig.default_config.default_model, ModelConfig
159
160
  ):