ibm-watsonx-orchestrate-evaluation-framework 1.0.3__py3-none-any.whl → 1.0.4__py3-none-any.whl
This diff shows the differences between the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of ibm-watsonx-orchestrate-evaluation-framework might be problematic. Click here for more details.
- {ibm_watsonx_orchestrate_evaluation_framework-1.0.3.dist-info → ibm_watsonx_orchestrate_evaluation_framework-1.0.4.dist-info}/METADATA +1 -1
- {ibm_watsonx_orchestrate_evaluation_framework-1.0.3.dist-info → ibm_watsonx_orchestrate_evaluation_framework-1.0.4.dist-info}/RECORD +5 -5
- wxo_agentic_evaluation/record_chat.py +16 -9
- {ibm_watsonx_orchestrate_evaluation_framework-1.0.3.dist-info → ibm_watsonx_orchestrate_evaluation_framework-1.0.4.dist-info}/WHEEL +0 -0
- {ibm_watsonx_orchestrate_evaluation_framework-1.0.3.dist-info → ibm_watsonx_orchestrate_evaluation_framework-1.0.4.dist-info}/top_level.txt +0 -0
|
@@ -10,7 +10,7 @@ wxo_agentic_evaluation/llm_matching.py,sha256=l010exoMmsvTIAVHCm-Ok0diyeQogjCmem
|
|
|
10
10
|
wxo_agentic_evaluation/llm_rag_eval.py,sha256=vsNGz1cFE5QGdhnfrx-iJq1r6q8tSI9Ef1mzuhoHElg,1642
|
|
11
11
|
wxo_agentic_evaluation/llm_user.py,sha256=0zSsyEM7pYQtLcfbnu0gEIkosHDwntOZY84Ito6__SM,1407
|
|
12
12
|
wxo_agentic_evaluation/main.py,sha256=tRXVle2o1JhwJZOTpqdsOzBOpxPYxAH5ziZkbCmzfyU,11470
|
|
13
|
-
wxo_agentic_evaluation/record_chat.py,sha256=
|
|
13
|
+
wxo_agentic_evaluation/record_chat.py,sha256=ZaOxIabDcE_CzZjKJESgh8LY7pK9UT4OvqQMFVdTG7A,8102
|
|
14
14
|
wxo_agentic_evaluation/resource_map.py,sha256=-dIWQdpEpPeSCbDeYfRupG9KV1Q4NlHGb5KXywjkulM,1645
|
|
15
15
|
wxo_agentic_evaluation/service_instance.py,sha256=yt7XpwheaRRG8Ri4TFIS5G2p5mnCwvNgj6T7bDF5uTU,6494
|
|
16
16
|
wxo_agentic_evaluation/test_prompt.py,sha256=ksteXCs9iDQPMETc4Hb7JAXHhxz2r678U6-sgZJAO28,3924
|
|
@@ -50,7 +50,7 @@ wxo_agentic_evaluation/service_provider/provider.py,sha256=MsnRzLYAaQiU6y6xf6eId
|
|
|
50
50
|
wxo_agentic_evaluation/service_provider/watsonx_provider.py,sha256=iKVkWs4PRTM_S0TIdPgQ9NFQWPlDvcEvuHpQlIPzO10,6216
|
|
51
51
|
wxo_agentic_evaluation/utils/__init__.py,sha256=QMxk6hx1CDvCBLFh40WpPZmqFNJtDqwXP7S7cXD6NQE,145
|
|
52
52
|
wxo_agentic_evaluation/utils/utils.py,sha256=JYZQZ-OBy43gAWg9S7duJi9StRApGJATs2JUsW1l30M,6057
|
|
53
|
-
ibm_watsonx_orchestrate_evaluation_framework-1.0.
|
|
54
|
-
ibm_watsonx_orchestrate_evaluation_framework-1.0.
|
|
55
|
-
ibm_watsonx_orchestrate_evaluation_framework-1.0.
|
|
56
|
-
ibm_watsonx_orchestrate_evaluation_framework-1.0.
|
|
53
|
+
ibm_watsonx_orchestrate_evaluation_framework-1.0.4.dist-info/METADATA,sha256=uhmuzKUbgWgKDNayG2dAc-YYvZ_ypeVY4onrcomv0Co,17667
|
|
54
|
+
ibm_watsonx_orchestrate_evaluation_framework-1.0.4.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
|
|
55
|
+
ibm_watsonx_orchestrate_evaluation_framework-1.0.4.dist-info/top_level.txt,sha256=2okpqtpxyqHoLyb2msio4pzqSg7yPSzwI7ekks96wYE,23
|
|
56
|
+
ibm_watsonx_orchestrate_evaluation_framework-1.0.4.dist-info/RECORD,,
|
|
@@ -132,7 +132,11 @@ def record_chats(config: ChatRecordingConfig):
|
|
|
132
132
|
# Process only new runs that started after our recording began
|
|
133
133
|
for run in all_runs:
|
|
134
134
|
thread_id = run.get("thread_id")
|
|
135
|
-
|
|
135
|
+
try:
|
|
136
|
+
agent_name = inference_backend.get_agent_name_from_thread_id(thread_id)
|
|
137
|
+
except Exception as e:
|
|
138
|
+
rich.print(f"[yellow]WARNING:[/yellow]Failure in getting thread id {thread_id}")
|
|
139
|
+
continue
|
|
136
140
|
if thread_id in seen_threads or agent_name is None:
|
|
137
141
|
continue
|
|
138
142
|
seen_threads.add(thread_id)
|
|
@@ -154,9 +158,9 @@ def record_chats(config: ChatRecordingConfig):
|
|
|
154
158
|
rich.print(
|
|
155
159
|
f"[green]INFO:[/green] Messages saved to: {os.path.join(config.output_dir, f'{thread_id}_messages.json')}"
|
|
156
160
|
)
|
|
157
|
-
rich.print(
|
|
158
|
-
|
|
159
|
-
)
|
|
161
|
+
# rich.print(
|
|
162
|
+
# f"[green]INFO:[/green] Annotations saved to: {os.path.join(config.output_dir, f'{thread_id}_annotated_data.json')}"
|
|
163
|
+
# )
|
|
160
164
|
processed_threads.add(thread_id)
|
|
161
165
|
|
|
162
166
|
try:
|
|
@@ -176,17 +180,20 @@ def record_chats(config: ChatRecordingConfig):
|
|
|
176
180
|
messages_filename = os.path.join(
|
|
177
181
|
config.output_dir, f"{thread_id}_messages.json"
|
|
178
182
|
)
|
|
179
|
-
annotation_filename = os.path.join(
|
|
180
|
-
config.output_dir, f"{thread_id}_annotated_data.json"
|
|
181
|
-
)
|
|
182
183
|
|
|
183
184
|
with open(messages_filename, "w") as f:
|
|
184
185
|
json.dump(
|
|
185
186
|
[msg.model_dump() for msg in messages], f, indent=4
|
|
186
187
|
)
|
|
187
188
|
|
|
188
|
-
|
|
189
|
-
|
|
189
|
+
# TO-DO: we want some tracing but we also do not want to persist the file
|
|
190
|
+
# in the same folder.
|
|
191
|
+
# annotation_filename = os.path.join(
|
|
192
|
+
# config.output_dir, f"{thread_id}_annotated_data.json"
|
|
193
|
+
# )
|
|
194
|
+
|
|
195
|
+
# with open(annotation_filename, "w") as f:
|
|
196
|
+
# json.dump(annotated_data, f, indent=4)
|
|
190
197
|
except Exception as e:
|
|
191
198
|
rich.print(
|
|
192
199
|
f"[red]ERROR:[/red] Failed to process thread {thread_id}: {str(e)}"
|
|
File without changes
|