Spaces:

build-small-hackathon
/

matchday

Running

mzidan000 committed 18 days ago

Commit

e7be4df

verified ·

1 Parent(s): ea60d1a

Upload folder using huggingface_hub

Files changed (2) hide show

matchday/agent_trace.py CHANGED Viewed

@@ -433,7 +433,14 @@ def validate_packages(result: Any, trip: Any | None = None) -> list[dict[str, st
                 f"{late} of {checked} flight(s) land after kickoff" if late
                 else f"{checked} flight(s) land before kickoff")
         else:
-            add("arrival before kickoff", "skipped", "kickoff/arrival times not comparable")
     else:
         late = [p for p in packages
                 if float((getattr(p, "scores", {}) or {}).get("arrival_buffer", 1) or 1) <= 0]

                 f"{late} of {checked} flight(s) land after kickoff" if late
                 else f"{checked} flight(s) land before kickoff")
         else:
+            # kickoff present but not directly comparable to the arrival time
+            # (e.g. a bare time/str) — fall back to the normalized arrival-buffer
+            # score (>0 means the package lands before kickoff). Honest: it
+            # evaluates instead of skipping when a strict datetime compare can't.
+            late = [p for p in packages
+                    if float((getattr(p, "scores", {}) or {}).get("arrival_buffer", 1) or 1) <= 0]
+            add("arrival before kickoff", "fail" if late else "pass",
+                "arrival-buffer score <= 0" if late else "positive arrival buffer on every package")
     else:
         late = [p for p in packages
                 if float((getattr(p, "scores", {}) or {}).get("arrival_buffer", 1) or 1) <= 0]

matchday/record_trace.py CHANGED Viewed

@@ -29,6 +29,7 @@ from pathlib import Path
 from matchday.agent import MatchDayAgent
 from matchday.agent_loop import run_agent_loop
 from matchday.intent import parse_intent
 from matchday.models import TripRequest
 from matchday.prompts import EXPLANATION_HINT
@@ -178,6 +179,20 @@ async def record(query: str, out_path: str) -> None:
             packages=_packages_view(result),
             compact=format_for_nemotron(result),
         )
         explanation = await _explain(agent, query, trip, result)
         log(event="nemotron_explanation", text=explanation)
     elif agent_text:

 from matchday.agent import MatchDayAgent
 from matchday.agent_loop import run_agent_loop
+from matchday.agent_trace import validate_packages
 from matchday.intent import parse_intent
 from matchday.models import TripRequest
 from matchday.prompts import EXPLANATION_HINT
             packages=_packages_view(result),
             compact=format_for_nemotron(result),
         )
+        # Self-check / validation gate — the SAME deterministic gate the deployed
+        # plan_trip runs live (core agentic #8 self-check / #10 safe final
+        # recommendation). Recorded here so the artifact proves the output was
+        # validated before recommending: no invented match, sane prices, every
+        # flight lands before kickoff, stay brackets the match day.
+        validation = validate_packages(result, trip)
+        _vpass = sum(1 for c in validation if c.get("status") == "pass")
+        _vfail = sum(1 for c in validation if c.get("status") == "fail")
+        log(
+            event="self_check",
+            status="flagged" if _vfail else "all_clear",
+            passed=f"{_vpass}/{len(validation)}",
+            checks=validation,
+        )
         explanation = await _explain(agent, query, trip, result)
         log(event="nemotron_explanation", text=explanation)
     elif agent_text: