Spaces:
Sleeping
Sleeping
File size: 10,287 Bytes
"""Sprint A14-S5 — contrats déclaratifs des vues d'évaluation.

Tests de ``MetricSpec``, ``EvaluationView``, ``EvaluationSpec``,
``ProjectionSpec``. Pas de logique métier — juste les invariants
des dataclasses pydantic.
"""
from __future__ import annotations
import pytest
from pydantic import ValidationError
from picarones.domain import (
ArtifactType,
EvaluationSpec,
EvaluationView,
MetricSpec,
ProjectionSpec,
)
# ──────────────────────────────────────────────────────────────────────
# MetricSpec
# ──────────────────────────────────────────────────────────────────────
class TestMetricSpec:
    """Invariants of the declarative ``MetricSpec`` model."""

    @staticmethod
    def _cer_spec() -> MetricSpec:
        """Return the smallest spec these tests need: a name and input types."""
        return MetricSpec(
            name="cer",
            input_types=(ArtifactType.RAW_TEXT, ArtifactType.RAW_TEXT),
        )

    def test_minimal_spec(self) -> None:
        """Fields left out of the constructor fall back to their defaults."""
        spec = self._cer_spec()
        assert spec.name == "cer"
        assert spec.description == ""
        assert spec.higher_is_better is False
        assert spec.tags == frozenset()

    def test_higher_is_better_for_quality_metrics(self) -> None:
        """``higher_is_better`` and ``tags`` keep the values passed in."""
        spec = MetricSpec(
            name="ner_f1",
            input_types=(ArtifactType.ENTITIES, ArtifactType.ENTITIES),
            description="F1 micro sur entités nommées",
            higher_is_better=True,
            tags=frozenset({"ner", "icdar"}),
        )
        assert spec.higher_is_better is True
        assert "ner" in spec.tags

    def test_frozen(self) -> None:
        """Assigning to a field of an existing spec raises ``ValidationError``."""
        spec = self._cer_spec()
        with pytest.raises(ValidationError):
            spec.name = "wer"  # type: ignore[misc]

    def test_no_callable_field(self) -> None:
        """The spec exposes no ``func`` attribute.

        Unlike the former ``core.metric_registry.MetricSpec``, the callable
        lives in ``MetricRegistry`` rather than on the spec.
        """
        assert not hasattr(self._cer_spec(), "func")

    def test_extra_field_rejected(self) -> None:
        """An unknown keyword argument is rejected with ``ValidationError``."""
        with pytest.raises(ValidationError):
            MetricSpec(  # type: ignore[call-arg]
                name="cer",
                input_types=(ArtifactType.RAW_TEXT, ArtifactType.RAW_TEXT),
                bogus=42,
            )
# ──────────────────────────────────────────────────────────────────────
# ProjectionSpec
# ──────────────────────────────────────────────────────────────────────
class TestProjectionSpec:
    """Invariants of the declarative ``ProjectionSpec`` model."""

    @staticmethod
    def _alto_to_text() -> ProjectionSpec:
        """Return the parameter-less ALTO XML -> raw text projection."""
        return ProjectionSpec(
            source_type=ArtifactType.ALTO_XML,
            target_type=ArtifactType.RAW_TEXT,
            projector_name="alto_to_text",
        )

    def test_alto_to_text(self) -> None:
        """A cross-type projection keeps its types, has no params, is not identity."""
        projection = self._alto_to_text()
        assert projection.source_type == ArtifactType.ALTO_XML
        assert projection.target_type == ArtifactType.RAW_TEXT
        assert projection.params == {}
        assert projection.is_identity is False

    def test_identity_projection(self) -> None:
        """The raw text -> raw text ``identity`` projection reports ``is_identity``."""
        same_type = ArtifactType.RAW_TEXT
        projection = ProjectionSpec(
            source_type=same_type,
            target_type=same_type,
            projector_name="identity",
        )
        assert projection.is_identity is True

    def test_with_params(self) -> None:
        """Values given in ``params`` are readable back by key."""
        options = {"reading_order": "natural", "preserve_hyphens": True}
        projection = ProjectionSpec(
            source_type=ArtifactType.ALTO_XML,
            target_type=ArtifactType.RAW_TEXT,
            projector_name="alto_to_text",
            params=options,
        )
        assert projection.params["reading_order"] == "natural"
        assert projection.params["preserve_hyphens"] is True

    def test_frozen(self) -> None:
        """Assigning to a field of an existing projection raises ``ValidationError``."""
        projection = self._alto_to_text()
        with pytest.raises(ValidationError):
            projection.projector_name = "other"  # type: ignore[misc]

    def test_json_roundtrip(self) -> None:
        """Dumping to JSON and validating it back yields an equal projection."""
        original = ProjectionSpec(
            source_type=ArtifactType.ALTO_XML,
            target_type=ArtifactType.RAW_TEXT,
            projector_name="alto_to_text",
            params={"reading_order": "natural"},
        )
        payload = original.model_dump_json()
        restored = ProjectionSpec.model_validate_json(payload)
        assert original == restored
# ──────────────────────────────────────────────────────────────────────
# EvaluationView — la pièce centrale du S5
# ──────────────────────────────────────────────────────────────────────
class TestEvaluationView:
    """Invariants of the declarative ``EvaluationView`` model."""

    def test_text_final_view_canonical_shape(self) -> None:
        """A fully specified ``text_final`` view can be built from plain fields.

        This is the S5 definition of done: the view is instantiated from a
        name, candidate types, a projection and metric names, nothing else.
        """
        accepted_types = frozenset({
            ArtifactType.RAW_TEXT,
            ArtifactType.CORRECTED_TEXT,
            ArtifactType.ALTO_XML,
        })
        alto_projection = ProjectionSpec(
            source_type=ArtifactType.ALTO_XML,
            target_type=ArtifactType.RAW_TEXT,
            projector_name="alto_to_text",
        )
        text_final = EvaluationView(
            name="text_final",
            description="Compare les sorties textuelles finales.",
            candidate_types=accepted_types,
            projection=alto_projection,
            metric_names=("cer", "wer"),
            ignored_dimensions=("geometry", "block_structure"),
            warnings=("Cette vue ignore la structure spatiale.",),
        )
        assert text_final.name == "text_final"
        assert text_final.accepts(ArtifactType.RAW_TEXT)
        assert text_final.accepts(ArtifactType.ALTO_XML)
        assert not text_final.accepts(ArtifactType.IMAGE)

    def test_alto_view_no_projection(self) -> None:
        """A view comparing ALTO as-is can be declared with ``projection=None``."""
        alto_view = EvaluationView(
            name="alto_documentary",
            candidate_types=frozenset({ArtifactType.ALTO_XML}),
            projection=None,
            metric_names=("alto_validity", "line_alignment_f1"),
        )
        assert alto_view.projection is None

    def test_search_view_text_only(self) -> None:
        """A view listing only text types accepts raw text and refuses ALTO XML."""
        text_types = frozenset({
            ArtifactType.RAW_TEXT,
            ArtifactType.CORRECTED_TEXT,
        })
        search_view = EvaluationView(
            name="searchability",
            candidate_types=text_types,
            metric_names=("rare_token_recall", "numerical_sequences"),
        )
        assert search_view.accepts(ArtifactType.RAW_TEXT)
        assert not search_view.accepts(ArtifactType.ALTO_XML)

    def test_view_with_normalization_profile(self) -> None:
        """``normalization_profile`` keeps the name passed at construction."""
        diplomatic = EvaluationView(
            name="text_diplomatic",
            candidate_types=frozenset({ArtifactType.RAW_TEXT}),
            normalization_profile="medieval_french",
            metric_names=("cer",),
        )
        assert diplomatic.normalization_profile == "medieval_french"

    def test_empty_candidate_types_is_valid_but_useless(self) -> None:
        """An empty ``candidate_types`` set is accepted at construction.

        Nothing is validated when the view is built: a caller may create a
        view that accepts nothing, and it is up to the
        EvaluationViewExecutor to flag it at runtime.
        """
        accepts_nothing = EvaluationView(
            name="useless",
            candidate_types=frozenset(),
        )
        assert not accepts_nothing.accepts(ArtifactType.RAW_TEXT)

    def test_frozen(self) -> None:
        """Assigning to a field of an existing view raises ``ValidationError``."""
        frozen_view = EvaluationView(
            name="x",
            candidate_types=frozenset({ArtifactType.RAW_TEXT}),
        )
        with pytest.raises(ValidationError):
            frozen_view.name = "y"  # type: ignore[misc]

    def test_json_roundtrip(self) -> None:
        """Dumping to JSON and validating it back yields an equal view."""
        alto_projection = ProjectionSpec(
            source_type=ArtifactType.ALTO_XML,
            target_type=ArtifactType.RAW_TEXT,
            projector_name="alto_to_text",
        )
        original = EvaluationView(
            name="text_final",
            description="x",
            candidate_types=frozenset({ArtifactType.RAW_TEXT}),
            projection=alto_projection,
            normalization_profile="nfc",
            metric_names=("cer",),
            ignored_dimensions=("geometry",),
            warnings=("avertissement",),
        )
        payload = original.model_dump_json()
        restored = EvaluationView.model_validate_json(payload)
        assert original == restored
# ──────────────────────────────────────────────────────────────────────
# EvaluationSpec
# ──────────────────────────────────────────────────────────────────────
class TestEvaluationSpec:
    """Invariants of the ``EvaluationSpec`` container of views."""

    def test_empty_spec(self) -> None:
        """A spec built with no arguments holds an empty tuple of views."""
        empty = EvaluationSpec()
        assert empty.views == ()

    def test_multi_view_spec(self) -> None:
        """``view_by_name`` resolves declared names and returns ``None`` otherwise."""
        text_view = EvaluationView(
            name="text",
            candidate_types=frozenset({ArtifactType.RAW_TEXT}),
        )
        alto_view = EvaluationView(
            name="alto",
            candidate_types=frozenset({ArtifactType.ALTO_XML}),
        )
        spec = EvaluationSpec(views=(text_view, alto_view))
        assert len(spec.views) == 2
        for declared_name in ("text", "alto"):
            assert spec.view_by_name(declared_name) is not None
        assert spec.view_by_name("missing") is None

    def test_frozen(self) -> None:
        """Assigning to ``views`` on an existing spec raises ``ValidationError``."""
        spec = EvaluationSpec()
        with pytest.raises(ValidationError):
            spec.views = ()  # type: ignore[misc]
|