ibm-watsonx-orchestrate-evaluation-framework 1.0.3__py3-none-any.whl → 1.0.4__py3-none-any.whl

This diff compares the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of ibm-watsonx-orchestrate-evaluation-framework might be problematic. Click here for more details.

@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: ibm-watsonx-orchestrate-evaluation-framework
3
- Version: 1.0.3
3
+ Version: 1.0.4
4
4
  Summary: The WxO evaluation framework
5
5
  Author-email: Haode Qi <Haode.Qi@ibm.com>
6
6
  License: MIT
@@ -10,7 +10,7 @@ wxo_agentic_evaluation/llm_matching.py,sha256=l010exoMmsvTIAVHCm-Ok0diyeQogjCmem
10
10
  wxo_agentic_evaluation/llm_rag_eval.py,sha256=vsNGz1cFE5QGdhnfrx-iJq1r6q8tSI9Ef1mzuhoHElg,1642
11
11
  wxo_agentic_evaluation/llm_user.py,sha256=0zSsyEM7pYQtLcfbnu0gEIkosHDwntOZY84Ito6__SM,1407
12
12
  wxo_agentic_evaluation/main.py,sha256=tRXVle2o1JhwJZOTpqdsOzBOpxPYxAH5ziZkbCmzfyU,11470
13
- wxo_agentic_evaluation/record_chat.py,sha256=9l99n4TRdwDLAOKct0ZJKKXE5Y7qE7X5WLWUpWUHfLI,7739
13
+ wxo_agentic_evaluation/record_chat.py,sha256=ZaOxIabDcE_CzZjKJESgh8LY7pK9UT4OvqQMFVdTG7A,8102
14
14
  wxo_agentic_evaluation/resource_map.py,sha256=-dIWQdpEpPeSCbDeYfRupG9KV1Q4NlHGb5KXywjkulM,1645
15
15
  wxo_agentic_evaluation/service_instance.py,sha256=yt7XpwheaRRG8Ri4TFIS5G2p5mnCwvNgj6T7bDF5uTU,6494
16
16
  wxo_agentic_evaluation/test_prompt.py,sha256=ksteXCs9iDQPMETc4Hb7JAXHhxz2r678U6-sgZJAO28,3924
@@ -50,7 +50,7 @@ wxo_agentic_evaluation/service_provider/provider.py,sha256=MsnRzLYAaQiU6y6xf6eId
50
50
  wxo_agentic_evaluation/service_provider/watsonx_provider.py,sha256=iKVkWs4PRTM_S0TIdPgQ9NFQWPlDvcEvuHpQlIPzO10,6216
51
51
  wxo_agentic_evaluation/utils/__init__.py,sha256=QMxk6hx1CDvCBLFh40WpPZmqFNJtDqwXP7S7cXD6NQE,145
52
52
  wxo_agentic_evaluation/utils/utils.py,sha256=JYZQZ-OBy43gAWg9S7duJi9StRApGJATs2JUsW1l30M,6057
53
- ibm_watsonx_orchestrate_evaluation_framework-1.0.3.dist-info/METADATA,sha256=L6Hq_FbQ4AY3g3Aho2wC6Io9rcLpnwNDm49BPTHbVCQ,17667
54
- ibm_watsonx_orchestrate_evaluation_framework-1.0.3.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
55
- ibm_watsonx_orchestrate_evaluation_framework-1.0.3.dist-info/top_level.txt,sha256=2okpqtpxyqHoLyb2msio4pzqSg7yPSzwI7ekks96wYE,23
56
- ibm_watsonx_orchestrate_evaluation_framework-1.0.3.dist-info/RECORD,,
53
+ ibm_watsonx_orchestrate_evaluation_framework-1.0.4.dist-info/METADATA,sha256=uhmuzKUbgWgKDNayG2dAc-YYvZ_ypeVY4onrcomv0Co,17667
54
+ ibm_watsonx_orchestrate_evaluation_framework-1.0.4.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
55
+ ibm_watsonx_orchestrate_evaluation_framework-1.0.4.dist-info/top_level.txt,sha256=2okpqtpxyqHoLyb2msio4pzqSg7yPSzwI7ekks96wYE,23
56
+ ibm_watsonx_orchestrate_evaluation_framework-1.0.4.dist-info/RECORD,,
@@ -132,7 +132,11 @@ def record_chats(config: ChatRecordingConfig):
132
132
  # Process only new runs that started after our recording began
133
133
  for run in all_runs:
134
134
  thread_id = run.get("thread_id")
135
- agent_name = inference_backend.get_agent_name_from_thread_id(thread_id)
135
+ try:
136
+ agent_name = inference_backend.get_agent_name_from_thread_id(thread_id)
137
+ except Exception as e:
138
+ rich.print(f"[yellow]WARNING:[/yellow]Failure in getting thread id {thread_id}")
139
+ continue
136
140
  if thread_id in seen_threads or agent_name is None:
137
141
  continue
138
142
  seen_threads.add(thread_id)
@@ -154,9 +158,9 @@ def record_chats(config: ChatRecordingConfig):
154
158
  rich.print(
155
159
  f"[green]INFO:[/green] Messages saved to: {os.path.join(config.output_dir, f'{thread_id}_messages.json')}"
156
160
  )
157
- rich.print(
158
- f"[green]INFO:[/green] Annotations saved to: {os.path.join(config.output_dir, f'{thread_id}_annotated_data.json')}"
159
- )
161
+ # rich.print(
162
+ # f"[green]INFO:[/green] Annotations saved to: {os.path.join(config.output_dir, f'{thread_id}_annotated_data.json')}"
163
+ # )
160
164
  processed_threads.add(thread_id)
161
165
 
162
166
  try:
@@ -176,17 +180,20 @@ def record_chats(config: ChatRecordingConfig):
176
180
  messages_filename = os.path.join(
177
181
  config.output_dir, f"{thread_id}_messages.json"
178
182
  )
179
- annotation_filename = os.path.join(
180
- config.output_dir, f"{thread_id}_annotated_data.json"
181
- )
182
183
 
183
184
  with open(messages_filename, "w") as f:
184
185
  json.dump(
185
186
  [msg.model_dump() for msg in messages], f, indent=4
186
187
  )
187
188
 
188
- with open(annotation_filename, "w") as f:
189
- json.dump(annotated_data, f, indent=4)
189
+ # TO-DO: we want some tracing but we also do not want to persist the file
190
+ # in the same folder.
191
+ # annotation_filename = os.path.join(
192
+ # config.output_dir, f"{thread_id}_annotated_data.json"
193
+ # )
194
+
195
+ # with open(annotation_filename, "w") as f:
196
+ # json.dump(annotated_data, f, indent=4)
190
197
  except Exception as e:
191
198
  rich.print(
192
199
  f"[red]ERROR:[/red] Failed to process thread {thread_id}: {str(e)}"