hte-cli 0.2.16.tar.gz → 0.2.17.tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {hte_cli-0.2.16 → hte_cli-0.2.17}/PKG-INFO +1 -1
- {hte_cli-0.2.16 → hte_cli-0.2.17}/pyproject.toml +1 -1
- {hte_cli-0.2.16 → hte_cli-0.2.17}/src/hte_cli/cli.py +16 -1
- {hte_cli-0.2.16 → hte_cli-0.2.17}/.gitignore +0 -0
- {hte_cli-0.2.16 → hte_cli-0.2.17}/README.md +0 -0
- {hte_cli-0.2.16 → hte_cli-0.2.17}/src/hte_cli/__init__.py +0 -0
- {hte_cli-0.2.16 → hte_cli-0.2.17}/src/hte_cli/__main__.py +0 -0
- {hte_cli-0.2.16 → hte_cli-0.2.17}/src/hte_cli/api_client.py +0 -0
- {hte_cli-0.2.16 → hte_cli-0.2.17}/src/hte_cli/config.py +0 -0
- {hte_cli-0.2.16 → hte_cli-0.2.17}/src/hte_cli/errors.py +0 -0
- {hte_cli-0.2.16 → hte_cli-0.2.17}/src/hte_cli/events.py +0 -0
- {hte_cli-0.2.16 → hte_cli-0.2.17}/src/hte_cli/image_utils.py +0 -0
- {hte_cli-0.2.16 → hte_cli-0.2.17}/src/hte_cli/runner.py +0 -0
- {hte_cli-0.2.16 → hte_cli-0.2.17}/src/hte_cli/scorers.py +0 -0
- {hte_cli-0.2.16 → hte_cli-0.2.17}/src/hte_cli/version_check.py +0 -0
- {hte_cli-0.2.16 → hte_cli-0.2.17}/tests/__init__.py +0 -0
- {hte_cli-0.2.16 → hte_cli-0.2.17}/tests/e2e/__init__.py +0 -0
- {hte_cli-0.2.16 → hte_cli-0.2.17}/tests/e2e/automated_runner.py +0 -0
- {hte_cli-0.2.16 → hte_cli-0.2.17}/tests/e2e/conftest.py +0 -0
- {hte_cli-0.2.16 → hte_cli-0.2.17}/tests/e2e/e2e_test.py +0 -0
- {hte_cli-0.2.16 → hte_cli-0.2.17}/tests/e2e/test_benchmark_flows.py +0 -0
- {hte_cli-0.2.16 → hte_cli-0.2.17}/tests/e2e/test_eval_logs.py +0 -0
- {hte_cli-0.2.16 → hte_cli-0.2.17}/tests/e2e/test_infrastructure.py +0 -0
- {hte_cli-0.2.16 → hte_cli-0.2.17}/tests/e2e/test_runtime_imports.py +0 -0
- {hte_cli-0.2.16 → hte_cli-0.2.17}/tests/e2e/test_session_lifecycle.py +0 -0
- {hte_cli-0.2.16 → hte_cli-0.2.17}/tests/e2e/verify_docker_deps.py +0 -0
- {hte_cli-0.2.16 → hte_cli-0.2.17}/uv.lock +0 -0
|
@@ -408,6 +408,21 @@ def session_join(ctx, session_id: str, force_setup: bool):
|
|
|
408
408
|
answer=result.answer,
|
|
409
409
|
)
|
|
410
410
|
|
|
411
|
+
# Extract agent_id from task files for CyberGym post-hoc verification
|
|
412
|
+
agent_id = None
|
|
413
|
+
if files_zip:
|
|
414
|
+
try:
|
|
415
|
+
from io import BytesIO
|
|
416
|
+
from zipfile import ZipFile
|
|
417
|
+
with ZipFile(BytesIO(files_zip)) as zf:
|
|
418
|
+
if "difficulty_levels.json" in zf.namelist():
|
|
419
|
+
with zf.open("difficulty_levels.json") as f:
|
|
420
|
+
import json
|
|
421
|
+
difficulty_info = json.load(f)
|
|
422
|
+
agent_id = difficulty_info.get("agent_id")
|
|
423
|
+
except Exception:
|
|
424
|
+
pass # Not a CyberGym task or malformed zip
|
|
425
|
+
|
|
411
426
|
console.print()
|
|
412
427
|
console.print("[green]Task completed![/green]")
|
|
413
428
|
console.print(f"Answer: {result.answer}")
|
|
@@ -428,7 +443,7 @@ def session_join(ctx, session_id: str, force_setup: bool):
|
|
|
428
443
|
eval_log_bytes=eval_log_bytes,
|
|
429
444
|
score=result.score,
|
|
430
445
|
score_binarized=result.score_binarized,
|
|
431
|
-
agent_id=
|
|
446
|
+
agent_id=agent_id,
|
|
432
447
|
)
|
|
433
448
|
except APIError as e:
|
|
434
449
|
console.print(f"[red]Failed to upload result: {e}[/red]")
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|