feat(direct_benchmark): add run ID to completion blocks

Include config:challenge:attempt and timestamp in the completion block header for easier debugging and log correlation.

Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>
2026-04-08 03:00:28 -04:00 · 2026-01-20 00:14:23 -06:00
parent 634bff8277
commit 00e02a4696
1 changed files with 18 additions and 5 deletions
--- a/classic/direct_benchmark/direct_benchmark/ui.py
+++ b/classic/direct_benchmark/direct_benchmark/ui.py
@@ -71,9 +71,9 @@ class BenchmarkUI:
            configure_logging_for_benchmark()

        # Track state - use run_key (config:challenge) for uniqueness
-        self.active_runs: dict[
-            str, tuple[str, str]
-        ] = {}  # run_key -> (config_name, challenge_name)
+        self.active_runs: dict[str, tuple[str, str]] = (
+            {}
+        )  # run_key -> (config_name, challenge_name)
        self.active_steps: dict[str, str] = {}  # run_key -> current step info
        self.completed: list[ChallengeResult] = []
        self.results_by_config: dict[str, list[ChallengeResult]] = {}
@@ -195,16 +195,29 @@ class BenchmarkUI:
        steps: list[tuple[int, str, str, bool]],
    ) -> None:
        """Print a copy-paste friendly completion block."""
+        from datetime import datetime
+
        color = self.get_config_color(config_name)
        status = "PASS" if result.success else "FAIL"
        status_style = "green" if result.success else "red"

-        # Print header
+        # Build challenge display with attempt if > 1
+        challenge_display = challenge_name
+        if result.attempt > 1:
+            challenge_display = f"{challenge_name} (attempt {result.attempt})"
+
+        # Generate timestamp for run identification
+        timestamp = datetime.now().strftime("%Y%m%d_%H%M%S")
+
+        # Print header with full identification
        console.print()
        console.print(f"[{status_style}]{'═' * 70}[/{status_style}]")
        console.print(
            f"[{status_style} bold][{status}][/{status_style} bold] "
-            f"[{color}]{config_name}[/{color}] - {challenge_name}"
+            f"[{color}]{config_name}[/{color}] - {challenge_display}"
+        )
+        console.print(
+            f"[dim]Run ID: {config_name}:{challenge_name}:{result.attempt} @ {timestamp}[/dim]"
        )
        console.print(f"[{status_style}]{'═' * 70}[/{status_style}]")