Spaces:

build-small-hackathon
/

trace-field-notes

Running on Zero

App Files Files Community

JacobLinCool Codex committed 26 days ago

Commit

7c8120d

verified ·

1 Parent(s): 6ac8ef6

feat: improve qwen zerogpu ux

Browse files

Co-authored-by: Codex <noreply@openai.com>

Files changed (6) hide show

README.md +9 -11
analyzer.py +1 -1
app.py +111 -65
model_runtime.py +5 -5
report_renderer.py +1 -1
tests/test_model_runtime.py +7 -1

README.md CHANGED Viewed

@@ -22,11 +22,11 @@ telemetry by default and analyzes only the agent's visible narrative messages:
 what it planned, where it got stuck, how it detoured, how it recovered, and how
 it claimed completion.
-Built for the Build Small Hackathon as a Gradio app. The default engine uses a
-verified deterministic codebook analyzer so the Space can always start and
-produce a report. The app also exposes explicit small-model assist modes for
-`nvidia/NVIDIA-Nemotron-3-Nano-30B-A3B-BF16` and `Qwen/Qwen3.5-9B` through
-Hugging Face Inference Providers when the user signs in with Hugging Face OAuth.
 ## Run Locally
@@ -45,12 +45,10 @@ python3.11 -m unittest discover -s tests
 ## Analysis Engines
-- `Deterministic field notes`: default, local, no model dependency.
-- `Small-model assist: NVIDIA Nemotron 3 Nano 30B-A3B`: uses the hackathon-sized
-  30B total-parameter Nemotron model through the signed-in user's
-  `inference-api` OAuth scope.
-- `Quick small-model assist: Qwen3.5 9B`: optional lower-latency model-assisted
-  memo.
 If a selected model is unavailable or the user is not signed in, the report
 records the reason in model notes and returns the deterministic analysis instead

 what it planned, where it got stuck, how it detoured, how it recovered, and how
 it claimed completion.
+Built for the Build Small Hackathon as a Gradio app. The default engine is the
+quick Qwen3.5 9B model-assisted path on ZeroGPU, with a verified deterministic
+codebook analyzer as the always-available recovery path. The app also exposes
+`nvidia/NVIDIA-Nemotron-3-Nano-30B-A3B-BF16` through Hugging Face Inference
+Providers when the user signs in with Hugging Face OAuth.
 ## Run Locally
 ## Analysis Engines
+- `Quick small-model assist: Qwen3.5 9B`: default model-assisted memo.
+- `NVIDIA Nemotron 3 Nano 30B-A3B assist`: uses Nemotron through the signed-in
+  user's `inference-api` OAuth scope.
+- `Deterministic field notes`: local, no model dependency.
 If a selected model is unavailable or the user is not signed in, the report
 records the reason in model notes and returns the deterministic analysis instead

analyzer.py CHANGED Viewed

@@ -197,7 +197,7 @@ def analyze_trace_file(
                 )
             except Exception as exc:
                 result.model_notes.append(
-                    "Small-model assist was requested but unavailable: "
                     f"{type(exc).__name__}: {exc}. Deterministic analysis was returned."
                 )
             else:

                 )
             except Exception as exc:
                 result.model_notes.append(
+                    "Model assist was requested but unavailable: "
                     f"{type(exc).__name__}: {exc}. Deterministic analysis was returned."
                 )
             else:

app.py CHANGED Viewed

@@ -17,6 +17,8 @@ from report_renderer import render_report
 SPACE_URL = "https://huggingface.co/spaces/build-small-hackathon/trace-field-notes"
 PRIVACY_WARNING = (
     "Agent traces can contain prompts, tool inputs, command outputs, local file paths, "
@@ -25,34 +27,22 @@ PRIVACY_WARNING = (
 )
 HERO_MD = f"""
-# Trace Field Notes
-See how your coding agent got stuck, detoured, recovered, and claimed success.
-Upload a Codex, Claude Code, or Pi Agent session log. The app extracts visible narrative messages, classifies difficulty episodes, and turns the session into a qualitative field report.
-> {PRIVACY_WARNING}
 """
 SESSION_PATHS_MD = """
-## Find Your Session Log
 | Agent | Local session directory |
 |---|---|
 | Codex | `~/.codex/sessions` |
 | Claude Code | `~/.claude/projects` |
 | Pi Agent | `~/.pi/agent/sessions` |
-```bash
-# Codex
-ls ~/.codex/sessions
-# Claude Code
-ls ~/.claude/projects
-# Pi Agent
-ls ~/.pi/agent/sessions
-```
 """
 AGENT_PROMPT = f"""Use this Space as a tool.
@@ -69,26 +59,81 @@ AGENT_PROMPT = f"""Use this Space as a tool.
 CUSTOM_CSS = """
 :root {
-  --field-border: #d7d0c2;
-  --field-ink: #202124;
-  --field-muted: #605b52;
-  --field-paper: #fbfaf7;
-  --field-accent: #326b59;
 }
 .gradio-container {
-  max-width: 1180px !important;
   color: var(--field-ink);
 }
 .trace-panel {
   border: 1px solid var(--field-border);
   border-radius: 8px;
-  padding: 14px;
-  background: var(--field-paper);
 }
 button.primary {
   background: var(--field-accent) !important;
   border-color: var(--field-accent) !important;
 }
 textarea, input {
   border-radius: 6px !important;
 }
@@ -101,7 +146,7 @@ def _analyze_trace_impl(
     redact_secrets: bool = True,
     ignore_tool_calls: bool = True,
     report_style: str = "field_notes",
-    analysis_engine: str = "deterministic",
     oauth_token: Optional[gr.OAuthToken] = None,
 ) -> tuple[str, dict[str, Any], str, str, str]:
     """Gradio-callable analysis endpoint."""
@@ -144,7 +189,7 @@ def analyze_trace(
     redact_secrets: bool = True,
     ignore_tool_calls: bool = True,
     report_style: str = "field_notes",
-    analysis_engine: str = "deterministic",
     oauth_token: Optional[gr.OAuthToken] = None,
 ) -> tuple[str, dict[str, Any], str, str, str]:
     """ZeroGPU-visible Gradio endpoint."""
@@ -184,6 +229,10 @@ def write_temp_artifact(prefix: str, suffix: str, content: str) -> str:
         return handle.name
 with gr.Blocks(
     title="Trace Field Notes",
     css=CUSTOM_CSS,
@@ -198,23 +247,24 @@ with gr.Blocks(
     with gr.Row(equal_height=False):
         with gr.Column(scale=3, elem_classes=["trace-panel"]):
             trace_input = gr.File(
-                label="Upload Agent Session Log",
                 file_types=[".jsonl", ".json", ".txt", ".log"],
                 type="filepath",
             )
             with gr.Row():
                 include_user_context = gr.Checkbox(
                     value=True,
-                    label="Include user prompts as context",
                 )
                 redact_secrets = gr.Checkbox(
                     value=True,
-                    label="Redact likely secrets before analysis",
                 )
             ignore_tool_calls = gr.Checkbox(
                 value=True,
-                label="Ignore tool call contents",
                 interactive=False,
             )
             report_style = gr.Radio(
@@ -222,13 +272,14 @@ with gr.Blocks(
                 value="field_notes",
                 label="Report style",
                 interactive=False,
             )
             analysis_engine = gr.Radio(
                 choices=[
                     (str(choice["label"]), key)
                     for key, choice in MODEL_CHOICES.items()
                 ],
-                value="deterministic",
                 label="Analysis engine",
             )
             with gr.Row():
@@ -241,31 +292,24 @@ with gr.Blocks(
                 "Model-assisted modes use your signed-in Hugging Face OAuth token with the `inference-api` scope. "
                 "The deterministic engine does not require sign-in."
             )
-            analyze_button = gr.Button("Analyze My Trace", variant="primary")
-        with gr.Column(scale=2):
             gr.Markdown(SESSION_PATHS_MD)
-    with gr.Accordion("Agent-callable prompt", open=False):
-        gr.Textbox(
-            value=AGENT_PROMPT,
-            label="Prompt for Codex or Claude Code",
-            lines=9,
-            interactive=False,
-            show_copy_button=True,
-        )
-    gr.Examples(
-        examples=[
-            [
-                "examples/sample_trace_redacted.jsonl",
-                True,
-                True,
-                True,
-                "field_notes",
-                "deterministic",
-            ]
-        ],
-        inputs=[
             trace_input,
             include_user_context,
             redact_secrets,
@@ -273,16 +317,18 @@ with gr.Blocks(
             report_style,
             analysis_engine,
         ],
-        label="Try a redacted sample trace",
     )
-    report_output = gr.Markdown(label="Field Report")
-    with gr.Row():
-        episode_json = gr.JSON(label="Structured Episode JSON")
-    with gr.Row():
-        redacted_download = gr.File(label="Download Redacted Narrative")
-        report_download = gr.File(label="Download Markdown Report")
-        json_download = gr.File(label="Download Structured JSON")
     analyze_button.click(
         analyze_trace,

 SPACE_URL = "https://huggingface.co/spaces/build-small-hackathon/trace-field-notes"
+DEFAULT_ANALYSIS_ENGINE = "qwen"
+SAMPLE_TRACE_PATH = "examples/sample_trace_redacted.jsonl"
 PRIVACY_WARNING = (
     "Agent traces can contain prompts, tool inputs, command outputs, local file paths, "
 )
 HERO_MD = f"""
+<div class="hero">
+  <div class="hero-kicker">ZeroGPU field report</div>
+  <h1>Trace Field Notes</h1>
+  <p>Map where a coding agent got stuck, changed route, recovered, and claimed success.</p>
+</div>
+<div class="privacy-callout">{PRIVACY_WARNING}</div>
 """
 SESSION_PATHS_MD = """
+### Session Logs
 | Agent | Local session directory |
 |---|---|
 | Codex | `~/.codex/sessions` |
 | Claude Code | `~/.claude/projects` |
 | Pi Agent | `~/.pi/agent/sessions` |
 """
 AGENT_PROMPT = f"""Use this Space as a tool.
 CUSTOM_CSS = """
 :root {
+  --field-border: rgba(148, 163, 184, 0.28);
+  --field-ink: #f8fafc;
+  --field-muted: #94a3b8;
+  --field-panel: rgba(15, 23, 42, 0.74);
+  --field-panel-strong: rgba(15, 23, 42, 0.92);
+  --field-accent: #2f8a69;
+  --field-accent-strong: #23785d;
 }
 .gradio-container {
+  max-width: 1220px !important;
   color: var(--field-ink);
 }
+.hero {
+  border: 1px solid var(--field-border);
+  border-radius: 8px;
+  padding: 18px 20px;
+  background: linear-gradient(135deg, rgba(47, 138, 105, 0.18), rgba(15, 23, 42, 0.3));
+}
+.hero h1 {
+  margin: 0;
+  font-size: 34px;
+  line-height: 1.08;
+}
+.hero p {
+  max-width: 760px;
+  margin: 10px 0 0;
+  color: var(--field-muted);
+  font-size: 15px;
+}
+.hero-kicker {
+  margin-bottom: 8px;
+  color: #7dd3fc;
+  font: 700 12px/1.2 ui-monospace, SFMono-Regular, Menlo, Monaco, Consolas, monospace;
+  text-transform: uppercase;
+  letter-spacing: 0;
+}
+.privacy-callout {
+  margin: 12px 0 16px;
+  border-left: 3px solid #f59e0b;
+  padding: 10px 12px;
+  color: #dbe4ef;
+  background: rgba(245, 158, 11, 0.08);
+  border-radius: 0 6px 6px 0;
+}
 .trace-panel {
   border: 1px solid var(--field-border);
   border-radius: 8px;
+  padding: 16px;
+  background: var(--field-panel);
+}
+.guide-panel {
+  border: 1px solid var(--field-border);
+  border-radius: 8px;
+  padding: 16px;
+  background: var(--field-panel);
+}
+.guide-panel table {
+  width: 100%;
+}
+.action-row button {
+  min-height: 42px;
 }
 button.primary {
   background: var(--field-accent) !important;
   border-color: var(--field-accent) !important;
 }
+button.primary:hover {
+  background: var(--field-accent-strong) !important;
+}
+.download-row {
+  align-items: stretch;
+}
+.result-tabs {
+  margin-top: 14px;
+}
 textarea, input {
   border-radius: 6px !important;
 }
     redact_secrets: bool = True,
     ignore_tool_calls: bool = True,
     report_style: str = "field_notes",
+    analysis_engine: str = DEFAULT_ANALYSIS_ENGINE,
     oauth_token: Optional[gr.OAuthToken] = None,
 ) -> tuple[str, dict[str, Any], str, str, str]:
     """Gradio-callable analysis endpoint."""
     redact_secrets: bool = True,
     ignore_tool_calls: bool = True,
     report_style: str = "field_notes",
+    analysis_engine: str = DEFAULT_ANALYSIS_ENGINE,
     oauth_token: Optional[gr.OAuthToken] = None,
 ) -> tuple[str, dict[str, Any], str, str, str]:
     """ZeroGPU-visible Gradio endpoint."""
         return handle.name
+def load_sample_trace() -> tuple[str, bool, bool, bool, str, str]:
+    return SAMPLE_TRACE_PATH, True, True, True, "field_notes", DEFAULT_ANALYSIS_ENGINE
 with gr.Blocks(
     title="Trace Field Notes",
     css=CUSTOM_CSS,
     with gr.Row(equal_height=False):
         with gr.Column(scale=3, elem_classes=["trace-panel"]):
+            gr.Markdown("### Trace Input")
             trace_input = gr.File(
+                label="Agent session log",
                 file_types=[".jsonl", ".json", ".txt", ".log"],
                 type="filepath",
             )
             with gr.Row():
                 include_user_context = gr.Checkbox(
                     value=True,
+                    label="Include user context",
                 )
                 redact_secrets = gr.Checkbox(
                     value=True,
+                    label="Redact likely secrets",
                 )
             ignore_tool_calls = gr.Checkbox(
                 value=True,
+                label="Ignore tool contents",
                 interactive=False,
             )
             report_style = gr.Radio(
                 value="field_notes",
                 label="Report style",
                 interactive=False,
+                visible=False,
             )
             analysis_engine = gr.Radio(
                 choices=[
                     (str(choice["label"]), key)
                     for key, choice in MODEL_CHOICES.items()
                 ],
+                value=DEFAULT_ANALYSIS_ENGINE,
                 label="Analysis engine",
             )
             with gr.Row():
                 "Model-assisted modes use your signed-in Hugging Face OAuth token with the `inference-api` scope. "
                 "The deterministic engine does not require sign-in."
             )
+            with gr.Row(elem_classes=["action-row"]):
+                analyze_button = gr.Button("Analyze My Trace", variant="primary")
+                sample_button = gr.Button("Use Sample Trace", variant="secondary")
+        with gr.Column(scale=2, elem_classes=["guide-panel"]):
             gr.Markdown(SESSION_PATHS_MD)
+            with gr.Accordion("Agent-callable prompt", open=False):
+                gr.Textbox(
+                    value=AGENT_PROMPT,
+                    label="Prompt for Codex or Claude Code",
+                    lines=9,
+                    interactive=False,
+                    show_copy_button=True,
+                )
+    sample_button.click(
+        load_sample_trace,
+        inputs=None,
+        outputs=[
             trace_input,
             include_user_context,
             redact_secrets,
             report_style,
             analysis_engine,
         ],
     )
+    with gr.Tabs(elem_classes=["result-tabs"]):
+        with gr.Tab("Field Report"):
+            report_output = gr.Markdown(label="Field Report")
+        with gr.Tab("Episodes JSON"):
+            episode_json = gr.JSON(label="Structured Episode JSON")
+        with gr.Tab("Downloads"):
+            with gr.Row(elem_classes=["download-row"]):
+                redacted_download = gr.File(label="Redacted Narrative")
+                report_download = gr.File(label="Markdown Report")
+                json_download = gr.File(label="Structured JSON")
     analyze_button.click(
         analyze_trace,

model_runtime.py CHANGED Viewed

@@ -1,4 +1,4 @@
-"""Optional small-model assistance through Hugging Face Inference Providers."""
 from __future__ import annotations
@@ -19,7 +19,7 @@ MODEL_CHOICES = {
         "model_id": None,
     },
     "nemotron": {
-        "label": "Small-model assist: NVIDIA Nemotron 3 Nano 30B-A3B",
         "model_id": PRIMARY_MODEL_ID,
     },
     "qwen": {
@@ -57,7 +57,7 @@ def run_model_assist(
     token: str | None = None,
     client: ChatClient | None = None,
 ) -> ModelAssistResult:
-    """Ask the selected small model for a concise memo grounded in visible text."""
     model_id = model_id_for_engine(engine)
     if not model_id:
@@ -70,7 +70,7 @@ def run_model_assist(
         resolved_token = token or os.getenv("HF_TOKEN") or get_token()
         if not resolved_token:
             raise ValueError(
-                "Sign in with Hugging Face to enable small-model assist through "
                 "the inference-api OAuth scope."
             )
@@ -103,7 +103,7 @@ def run_model_assist(
     return ModelAssistResult(
         model_id=model_id,
         memo=memo,
-        note=f"Small-model assist completed with {model_id}.",
     )

+"""Optional model assistance through Hugging Face Inference Providers."""
 from __future__ import annotations
         "model_id": None,
     },
     "nemotron": {
+        "label": "NVIDIA Nemotron 3 Nano 30B-A3B assist",
         "model_id": PRIMARY_MODEL_ID,
     },
     "qwen": {
     token: str | None = None,
     client: ChatClient | None = None,
 ) -> ModelAssistResult:
+    """Ask the selected model for a concise memo grounded in visible text."""
     model_id = model_id_for_engine(engine)
     if not model_id:
         resolved_token = token or os.getenv("HF_TOKEN") or get_token()
         if not resolved_token:
             raise ValueError(
+                "Sign in with Hugging Face to enable model assist through "
                 "the inference-api OAuth scope."
             )
     return ModelAssistResult(
         model_id=model_id,
         memo=memo,
+        note=f"Model assist completed with {model_id}.",
     )

report_renderer.py CHANGED Viewed

@@ -76,7 +76,7 @@ def render_model_memo(result: AnalysisResult) -> str:
     if not result.model_memo and not result.model_notes:
         return ""
-    lines = ["## Small-Model Memo"]
     if result.model_memo:
         lines.append(result.model_memo.get("executive_memo", ""))
         lines.append(f"**Detours:** {result.model_memo.get('detour_memo', '')}")

     if not result.model_memo and not result.model_notes:
         return ""
+    lines = ["## Model Memo"]
     if result.model_memo:
         lines.append(result.model_memo.get("executive_memo", ""))
         lines.append(f"**Detours:** {result.model_memo.get('detour_memo', '')}")

tests/test_model_runtime.py CHANGED Viewed

@@ -7,7 +7,7 @@ from pathlib import Path
 from unittest.mock import patch
 from analyzer import analyze_trace_file
-from model_runtime import PRIMARY_MODEL_ID, parse_model_json, run_model_assist
 class FakeChatClient:
@@ -31,6 +31,12 @@ class FakeChatClient:
 class ModelRuntimeTests(unittest.TestCase):
     def test_parse_model_json_validates_required_shape(self) -> None:
         memo = parse_model_json(
             json.dumps(

 from unittest.mock import patch
 from analyzer import analyze_trace_file
+from model_runtime import MODEL_CHOICES, PRIMARY_MODEL_ID, parse_model_json, run_model_assist
 class FakeChatClient:
 class ModelRuntimeTests(unittest.TestCase):
+    def test_nemotron_label_does_not_call_it_small(self) -> None:
+        label = str(MODEL_CHOICES["nemotron"]["label"])
+        self.assertIn("NVIDIA Nemotron 3 Nano 30B-A3B", label)
+        self.assertNotIn("small", label.lower())
     def test_parse_model_json_validates_required_shape(self) -> None:
         memo = parse_model_json(
             json.dumps(