Spaces:

Ma-Ri-Ba-Ku
/

Picarones

Running

Claude committed 29 days ago

Commit

50b07b8

unverified ·

1 Parent(s): 6a8026b

feat(web,tests): Corr-A/B/C — exposer views + expose_alto + B2 features Web/test helper

Audit B3-final commit C2. Suite de C1 (CLI) — étend l'exposition
des features à la couche Web et corrige la divergence test↔prod
sur les vues identifiée par l'audit.

picarones/interfaces/web/models.py
- PipelineConfig.expose_alto: bool = False
(B5 — flag Tesseract ALTO XML)
- BenchmarkRunRequest.views: list[ViewName] = ["text_final"]
(B6 — défaut compat ascendante)
- BenchmarkRunRequest.profile: Literal[...] = "standard" (B2.6)
- BenchmarkRunRequest.partial_dir: str = "" (B2.3)
- BenchmarkRunRequest.entity_extractor: str = "" (B2.4)
- BenchmarkRunRequest.output_json: str = "" (B2.7)

picarones/interfaces/web/benchmark_utils.py
- _engine_from_competitor propage comp.expose_alto au factory
Tesseract uniquement (autres adapters ignorent).
- run_benchmark_thread_v2 propage views/profile/partial_dir/
entity_extractor/output_json à prepare_preset_args.

tests/_migration_helpers.py — helper test B4
- Nouveau kwarg views: tuple[str, ...] = ("text_final",)
propagé à prepare_preset_args.
- Corrige la divergence test↔prod identifiée par l'audit
(le helper test ne supportait pas les vues multi-format,
aucun test B4 ne couvrait ce chemin).

tests/app/services/test_python_helpers.py
- Nouveau TestMigrationHelperViewsPropagation : 1 cas qui
vérifie que le helper propage bien views au RunResult final
(text_final-only vs multi-vues).

Tests : 10 passed pour les helpers, 484 passed pour CLI+Web.

Impact utilisateur (API REST POST /api/benchmark/run) :
{
"corpus_path": "./corpus",
"competitors": [{"engine_name": "tesseract", "expose_alto": true}],
"views": ["text_final", "alto_documentary", "searchability"],
"profile": "standard"
}
→ rapport HTML avec 3 sections de vues + ALTO Tesseract.

Files changed (4) hide show

picarones/interfaces/web/benchmark_utils.py +15 -2
picarones/interfaces/web/models.py +38 -0
tests/_migration_helpers.py +2 -0
tests/app/services/test_python_helpers.py +37 -0

picarones/interfaces/web/benchmark_utils.py CHANGED Viewed

@@ -251,6 +251,11 @@ def _engine_from_competitor(comp: PipelineConfig) -> Any:
         # n'est plus possible de l'oublier pour un nouveau moteur.
         try:
             kwargs = _build_ocr_kwargs(engine_id, comp.ocr_model)
             ocr = ocr_adapter_from_name(engine_id, **kwargs)
         except ValueError as exc:
             # Adapter indisponible (dépendance optionnelle absente)
@@ -384,13 +389,21 @@ def run_benchmark_thread_v2(job: BenchmarkJob, req: BenchmarkRunRequest) -> None
         with tempfile.TemporaryDirectory(prefix="picarones_web_") as _ws:
             _ws_path = Path(_ws)
             _run_dir = _ws_path / "run"
             _preset = prepare_preset_args(
                 corpus, engines,
                 workspace_dir=_ws_path / "gt",
                 output_dir=_run_dir,
                 char_exclude=char_excl,
                 normalization_profile=req.normalization_profile,
-                output_json=output_json,
             )
             _orch_result = RunOrchestrator(_run_dir).execute_preset(
                 spec=_preset.spec,
@@ -407,7 +420,7 @@ def run_benchmark_thread_v2(job: BenchmarkJob, req: BenchmarkRunRequest) -> None
                 corpus=corpus, engines=engines,
                 char_exclude=char_excl,
                 normalization_profile=req.normalization_profile,
-                profile="standard",
             )
         if job.status == "cancelled":

         # n'est plus possible de l'oublier pour un nouveau moteur.
         try:
             kwargs = _build_ocr_kwargs(engine_id, comp.ocr_model)
+            # Phase B3-final corr-B (mai 2026) — propage expose_alto
+            # à Tesseract (les autres adapters ignorent ce kwarg via
+            # validation du factory).
+            if comp.expose_alto and engine_id.lower() in {"tesseract", "tess"}:
+                kwargs["expose_alto"] = True
             ocr = ocr_adapter_from_name(engine_id, **kwargs)
         except ValueError as exc:
             # Adapter indisponible (dépendance optionnelle absente)
         with tempfile.TemporaryDirectory(prefix="picarones_web_") as _ws:
             _ws_path = Path(_ws)
             _run_dir = _ws_path / "run"
+            # Phase B3-final corr-A/B/C (mai 2026) — propage les
+            # nouveaux champs ``BenchmarkRunRequest`` (views, profile,
+            # partial_dir, entity_extractor, output_json).
+            _views_tuple = tuple(req.views) if req.views else ("text_final",)
             _preset = prepare_preset_args(
                 corpus, engines,
                 workspace_dir=_ws_path / "gt",
                 output_dir=_run_dir,
+                views=_views_tuple,
                 char_exclude=char_excl,
                 normalization_profile=req.normalization_profile,
+                profile=req.profile,
+                partial_dir=req.partial_dir or None,
+                entity_extractor=req.entity_extractor or None,
+                output_json=req.output_json or output_json,
             )
             _orch_result = RunOrchestrator(_run_dir).execute_preset(
                 spec=_preset.spec,
                 corpus=corpus, engines=engines,
                 char_exclude=char_excl,
                 normalization_profile=req.normalization_profile,
+                profile=req.profile,
             )
         if job.status == "cancelled":

picarones/interfaces/web/models.py CHANGED Viewed

@@ -121,6 +121,17 @@ class PipelineConfig(BaseModel):
     autorisée pour indiquer qu'aucun LLM n'est attaché au moteur OCR.
     """
     prompt_file: str = Field(default="", max_length=_MAX_PROMPT_FILENAME)
 class BenchmarkRunRequest(BaseModel):
@@ -133,6 +144,33 @@ class BenchmarkRunRequest(BaseModel):
     output_dir: str = Field(default="./rapports/", max_length=_MAX_PATH)
     report_name: str = Field(default="", max_length=_MAX_NAME)
     report_lang: ReportLang = "fr"
 __all__ = [

     autorisée pour indiquer qu'aucun LLM n'est attaché au moteur OCR.
     """
     prompt_file: str = Field(default="", max_length=_MAX_PROMPT_FILENAME)
+    expose_alto: bool = False
+    """Phase B3-final corr-B (mai 2026) — active la production native
+    d'ALTO XML par Tesseract via ``pytesseract.image_to_alto_xml``.
+    Combiné avec ``BenchmarkRunRequest.views`` contenant
+    ``alto_documentary``, débloque les sections multi-vues du rapport
+    HTML.  Ignoré pour les engines non-Tesseract."""
+# Phase B3-final corr-A — vues canoniques d'évaluation acceptées.
+ViewName = Literal["text_final", "alto_documentary", "searchability"]
 class BenchmarkRunRequest(BaseModel):
     output_dir: str = Field(default="./rapports/", max_length=_MAX_PATH)
     report_name: str = Field(default="", max_length=_MAX_NAME)
     report_lang: ReportLang = "fr"
+    # Phase B3-final corr-A/B/C (mai 2026) — exposition des features
+    # B2/B5/B6 aux clients de l'API REST.
+    views: list[ViewName] = Field(default_factory=lambda: ["text_final"])
+    """Liste des vues d'évaluation à appliquer.  Défaut :
+    ``["text_final"]`` (compat ascendante).  Pour activer le rapport
+    HTML multi-vues (AltoView, SearchView), passer ``["text_final",
+    "alto_documentary", "searchability"]``.  Nécessite que les
+    pipelines produisent les artefacts éligibles (ex :
+    ``alto_documentary`` requiert ``PipelineConfig.expose_alto=true``
+    côté Tesseract)."""
+    profile: Literal[
+        "minimal", "standard", "philological", "diagnostics",
+        "economics", "pipeline", "full",
+    ] = "standard"
+    """Phase B2.6 — profil de hooks document-level / corpus aggregators.
+    Sélectionne quels ``@register_document_metric`` /
+    ``@register_corpus_aggregator`` s'exécutent."""
+    partial_dir: str = Field(default="", max_length=_MAX_PATH)
+    """Phase B2.3 — répertoire pour la reprise sur interruption.
+    Vide = pas de resume."""
+    entity_extractor: str = Field(default="", max_length=_MAX_NAME * 4)
+    """Phase B2.4 — dotted path vers une factory d'extracteur d'entités
+    (ex : ``mypkg.ner:SpacyExtractor``).  Vide = pas de NER attach."""
+    output_json: str = Field(default="", max_length=_MAX_PATH)
+    """Phase B2.7 — chemin facultatif où sérialiser le BenchmarkResult
+    legacy en JSON.  Vide = pas de sortie JSON additionnelle (le
+    rapport HTML reste produit normalement)."""
 __all__ = [

tests/_migration_helpers.py CHANGED Viewed

@@ -34,6 +34,7 @@ def run_via_orchestrator(
     corpus: "Corpus",
     engines: list[Any],
     *,
     char_exclude: Any | None = None,
     normalization_profile: Any | None = None,
     output_json: str | Path | None = None,
@@ -97,6 +98,7 @@ def run_via_orchestrator(
             corpus, engines,
             workspace_dir=ws_path / "gt",
             output_dir=run_dir,
             char_exclude=char_exclude,
             normalization_profile=normalization_profile,
             partial_dir=partial_dir,

     corpus: "Corpus",
     engines: list[Any],
     *,
+    views: tuple[str, ...] = ("text_final",),
     char_exclude: Any | None = None,
     normalization_profile: Any | None = None,
     output_json: str | Path | None = None,
             corpus, engines,
             workspace_dir=ws_path / "gt",
             output_dir=run_dir,
+            views=views,
             char_exclude=char_exclude,
             normalization_profile=normalization_profile,
             partial_dir=partial_dir,

tests/app/services/test_python_helpers.py CHANGED Viewed

@@ -104,6 +104,43 @@ class TestNominal:
         )
 # ──────────────────────────────────────────────────────────────────────
 # Multi-engines
 # ──────────────────────────────────────────────────────────────────────

         )
+# ──────────────────────────────────────────────────────────────────────
+# Phase B3-final corr-A/D — vérifier que le helper test propage `views`
+# ──────────────────────────────────────────────────────────────────────
+class TestMigrationHelperViewsPropagation:
+    """Garantie que ``tests/_migration_helpers.run_via_orchestrator``
+    propage le param ``views`` à ``prepare_preset_args``.
+    Audit Phase B3-final a identifié une divergence test↔prod : le
+    helper de test ne transmettait pas ``views``, donc aucun test B4
+    ne couvrait le multi-vues via le helper.  Corr-D : helper test
+    aligné, test de propagation explicite.
+    """
+    def test_helper_propagates_views_to_run_result(
+        self, tmp_path: Path,
+    ) -> None:
+        from tests._migration_helpers import run_via_orchestrator
+        corpus = _make_corpus(tmp_path, n=1)
+        engine = _MockOCR()
+        # Sans param ``views`` → défaut text_final seulement.
+        bm_default = run_via_orchestrator(corpus, [engine])
+        assert "text_final" in bm_default.view_results
+        assert "alto_documentary" not in bm_default.view_results
+        # Avec ``views=...`` → propagation effective.
+        bm_multi = run_via_orchestrator(
+            corpus, [engine],
+            views=("text_final", "searchability"),
+        )
+        assert "text_final" in bm_multi.view_results
+        assert "searchability" in bm_multi.view_results
 # ──────────────────────────────────────────────────────────────────────
 # Multi-engines
 # ──────────────────────────────────────────────────────────────────────