hte-cli 0.1.20__tar.gz → 0.1.21__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: hte-cli
3
- Version: 0.1.20
3
+ Version: 0.1.21
4
4
  Summary: Human Time-to-Completion Evaluation CLI
5
5
  Project-URL: Homepage, https://github.com/sean-peters-au/lyptus-mono
6
6
  Author: Lyptus Research
@@ -1,6 +1,6 @@
1
1
  [project]
2
2
  name = "hte-cli"
3
- version = "0.1.20"
3
+ version = "0.1.21"
4
4
  description = "Human Time-to-Completion Evaluation CLI"
5
5
  readme = "README.md"
6
6
  requires-python = ">=3.11"
File without changes
File without changes
@@ -333,6 +333,7 @@ def tasks_run(ctx, task_id: str | None):
333
333
  console.print(f"[dim]Note: {e}[/dim]")
334
334
 
335
335
  # Validate compose for sandbox-required benchmarks
336
+ benchmark = assignment.get("benchmark", "").lower()
336
337
  SANDBOX_REQUIRED_BENCHMARKS = {"cybench", "intercode-ctf", "cvebench", "cybergym", "nyuctf"}
337
338
  if benchmark in SANDBOX_REQUIRED_BENCHMARKS and not compose_yaml:
338
339
  console.print(
@@ -354,7 +355,6 @@ def tasks_run(ctx, task_id: str | None):
354
355
  )
355
356
 
356
357
  # Step 4: Show pre-task message (benchmark-specific)
357
- benchmark = assignment.get("benchmark", "").lower()
358
358
  single_shot_benchmarks = {"nl2bash", "cybashbench"}
359
359
 
360
360
  console.print()
File without changes
File without changes
File without changes
File without changes
File without changes