cy0307 commited on 8 days ago

Commit

b9dbf0b

verified ·

1 Parent(s): c49778a

Add files using upload-large-folder tool

Browse files

Files changed (27) hide show

docs/data/artifact_index.json +21 -21
docs/data/episode128_task_model_radar.json +26 -26
docs/data/mirror_parity.json +208 -183
docs/data/publication_audit.json +4 -3
docs/data/quality_gates.json +1 -1
docs/data/scope_claims_audit.json +1 -1
docs/data/single_episode_task_model_radar.json +1 -1
docs/data/source_alignment_audit.json +1 -1
docs/data/task_method_20_gap_audit.json +11 -25
docs/data/task_method_20_result_matrix.json +18 -18
docs/data/unified_task_model_radar.json +30 -30
results/omni_finetune/xperience10m_qwen3_omni_v6_cross_modal_retrieval_probe_a100_20260618T000000Z/RUN_REPORT.md +8 -0
results/omni_finetune/xperience10m_qwen3_omni_v6_cross_modal_retrieval_probe_a100_20260618T000000Z/collection_validation.json +16 -0
results/omni_finetune/xperience10m_qwen3_omni_v6_cross_modal_retrieval_probe_a100_20260618T000000Z/cross_modal_retrieval/metrics.json +25 -0
results/omni_finetune/xperience10m_qwen3_omni_v6_cross_modal_retrieval_probe_a100_20260618T000000Z/launch_env.txt +11 -0
results/omni_finetune/xperience10m_qwen3_omni_v6_cross_modal_retrieval_probe_a100_20260618T000000Z/summary.json +19 -0
results/omni_finetune/xperience10m_qwen3_omni_v6_cross_modal_retrieval_probe_a100_20260618T000000Z/xperience10m_qwen3_omni_v6_cross_modal_retrieval_probe_a100_20260618T000000Z_shard0.progress.jsonl +0 -0
results/omni_finetune/xperience10m_qwen3_omni_v6_cross_modal_retrieval_probe_a100_20260618T000000Z/xperience10m_qwen3_omni_v6_cross_modal_retrieval_probe_a100_20260618T000000Z_shard1.progress.jsonl +0 -0
results/omni_finetune/xperience10m_qwen3_omni_v6_retrieval_task_probes_a100_20260617T175919Z/RUN_REPORT.md +8 -0
results/omni_finetune/xperience10m_qwen3_omni_v6_retrieval_task_probes_a100_20260617T175919Z/caption_grounding/metrics.json +24 -0
results/omni_finetune/xperience10m_qwen3_omni_v6_retrieval_task_probes_a100_20260617T175919Z/caption_grounding/predictions.csv +0 -0
results/omni_finetune/xperience10m_qwen3_omni_v6_retrieval_task_probes_a100_20260617T175919Z/collection_validation.json +16 -0
results/omni_finetune/xperience10m_qwen3_omni_v6_retrieval_task_probes_a100_20260617T175919Z/launch_env.txt +11 -0
results/omni_finetune/xperience10m_qwen3_omni_v6_retrieval_task_probes_a100_20260617T175919Z/summary.json +19 -0
results/omni_finetune/xperience10m_qwen3_omni_v6_retrieval_task_probes_a100_20260617T175919Z/xperience10m_qwen3_omni_v6_retrieval_task_probes_a100_20260617T175919Z_shard0.progress.jsonl +0 -0
results/omni_finetune/xperience10m_qwen3_omni_v6_retrieval_task_probes_a100_20260617T175919Z/xperience10m_qwen3_omni_v6_retrieval_task_probes_a100_20260617T175919Z_shard1.progress.jsonl +0 -0
scripts/omni/collect_qwen3_retrieval_task_probe_results.sh +89 -0

docs/data/artifact_index.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "title": "Ropedia Xperience-10M Task Suite Artifact Index",
-  "generated_at_utc": "2026-06-18T09:28:32+00:00",
   "status": "pass",
   "artifact_count": 213,
   "missing": [],
@@ -599,7 +599,7 @@
       "shows": "Machine-readable source-alignment pass/fail check for repo, website, and HF surfaces.",
       "exists": true,
       "bytes": 4432,
-      "sha256": "499e62359f6db0afa32c1160a2c4ca90da511c1035efaac4e77943c4905751a7"
     },
     {
       "id": "source_alignment_validator",
@@ -719,8 +719,8 @@
       "surface": "website_hf",
       "shows": "Stores normalized 20-axis radar values, raw task metrics, Qwen3/Cosmos overlay mappings, branch-card caveats, and explicit scoreless status records.",
       "exists": true,
-      "bytes": 231127,
-      "sha256": "3bcabe4b7182b66292c012f26401d753f581d9feb3d0adb312a5115933f34767"
     },
     {
       "id": "single_episode_task_model_radar_json",
@@ -731,7 +731,7 @@
       "shows": "Machine-readable split radar for the one-episode Minimal and Neural MLP baselines, both scored on all 20 task contracts.",
       "exists": true,
       "bytes": 50973,
-      "sha256": "01d524bca7b7a827134ac00af76659745f6c2127096064078f99c3db151cc7e0"
     },
     {
       "id": "episode128_task_model_radar_json",
@@ -741,8 +741,8 @@
       "surface": "website_hf",
       "shows": "Machine-readable split radar for selected 128-episode metadata/raw baselines and verified Qwen3/Cosmos branches, preserving explicit scoreless cells.",
       "exists": true,
-      "bytes": 187275,
-      "sha256": "e006cb7f6c0c8bf7258a42206ec095b4ad2622c4bd7b9f67275d8a9cae2105a5"
     },
     {
       "id": "task_method_20_result_matrix_json",
@@ -752,8 +752,8 @@
       "surface": "website_hf",
       "shows": "Machine-readable 9-method by 20-task matrix where every method has 20 records and scoreless cells carry unsupported/not-evaluated reasons.",
       "exists": true,
-      "bytes": 129689,
-      "sha256": "d633cbc900b04df4afef67a75a9d17d79c9da2942a43ab0d5d31dcf270af2c94"
     },
     {
       "id": "task_method_20_result_matrix",
@@ -763,8 +763,8 @@
       "surface": "repo_hf",
       "shows": "Reader-facing table that separates 20 records per method from numeric scored axes, documented raw128 proxy scores, unsupported metadata targets, and model targets not evaluated in verified packages.",
       "exists": true,
-      "bytes": 4152,
-      "sha256": "c5ce3d4dc21751dc0b7e371ac0d92790190e306f48b0147d99952646ae2dedb1"
     },
     {
       "id": "task_method_20_gap_audit_json",
@@ -774,8 +774,8 @@
       "surface": "website_hf",
       "shows": "Machine-readable 180-record gap ledger with numeric scores, scoreless cells, explicit status reasons, and next evidence needed before new scores can be published.",
       "exists": true,
-      "bytes": 52867,
-      "sha256": "255ba3324994ee1848a99f6bc08b74b447a63a18638d43b93017dbb591b19c6d"
     },
     {
       "id": "task_method_20_gap_audit",
@@ -785,8 +785,8 @@
       "surface": "repo_hf",
       "shows": "Reader-facing ledger that lists every scoreless method-task cell and the concrete target or model-output evidence required before it can become numeric.",
       "exists": true,
-      "bytes": 14981,
-      "sha256": "90f9885e601b2f19af863650fae7821092147ada1d86bb945b08c3cd603197ac"
     },
     {
       "id": "unified_task_model_radar_chart",
@@ -796,8 +796,8 @@
       "surface": "website_hf",
       "shows": "Compares minimal and neural MLP baselines across all 20 tasks, with Qwen3/Cosmos task-aligned model overlays.",
       "exists": true,
-      "bytes": 50506,
-      "sha256": "890cbddb57e241e4360c96c18a013c98ed56d26711f136babac6e3313751bbfb"
     },
     {
       "id": "single_episode_task_model_radar_chart",
@@ -818,8 +818,8 @@
       "surface": "website_hf",
       "shows": "Separates the selected 128-episode methods: raw-feature simple/NN as complete 20/20 scored polygons and metadata/Qwen/Cosmos as task-aligned overlays.",
       "exists": true,
-      "bytes": 44490,
-      "sha256": "537c0dc2f1173bc40aaa216cbf760aeea30c9325ddd5c08e1f16e476d4c01bdd"
     },
     {
       "id": "unified_task_model_radar_builder",
@@ -1105,7 +1105,7 @@
       "shows": "Machine-readable release-check summary for validators, mirrors, and public project surfaces.",
       "exists": true,
       "bytes": 8100,
-      "sha256": "42938d8fe2b86f4f74f27138c8099cc65bb37c092100544cda0913bf29144e09"
     },
     {
       "id": "public_surface_qa",
@@ -1286,7 +1286,7 @@
       "volatile": true,
       "shows": "Confirms public bundles exclude raw data, caches, heavy archives, and credential text.",
       "exists": true,
-      "bytes": 9341,
       "hash_policy": "existence_and_size_only"
     },
     {

 {
   "title": "Ropedia Xperience-10M Task Suite Artifact Index",
+  "generated_at_utc": "2026-06-18T10:04:51+00:00",
   "status": "pass",
   "artifact_count": 213,
   "missing": [],
       "shows": "Machine-readable source-alignment pass/fail check for repo, website, and HF surfaces.",
       "exists": true,
       "bytes": 4432,
+      "sha256": "8494b6983100acdfde9b5929e871b27120897af8ec7b5a3031aa142b598a09ae"
     },
     {
       "id": "source_alignment_validator",
       "surface": "website_hf",
       "shows": "Stores normalized 20-axis radar values, raw task metrics, Qwen3/Cosmos overlay mappings, branch-card caveats, and explicit scoreless status records.",
       "exists": true,
+      "bytes": 231123,
+      "sha256": "c004d35f0a3e0073c4116dd79a2bcdaac872605d715a7eccdaa15787df800f07"
     },
     {
       "id": "single_episode_task_model_radar_json",
       "shows": "Machine-readable split radar for the one-episode Minimal and Neural MLP baselines, both scored on all 20 task contracts.",
       "exists": true,
       "bytes": 50973,
+      "sha256": "6db28943d1206aef75fbce8ea87ea52a35c0144c6186214f37da9311ca8c9a0c"
     },
     {
       "id": "episode128_task_model_radar_json",
       "surface": "website_hf",
       "shows": "Machine-readable split radar for selected 128-episode metadata/raw baselines and verified Qwen3/Cosmos branches, preserving explicit scoreless cells.",
       "exists": true,
+      "bytes": 187271,
+      "sha256": "acd8623ad19bf0d0ee1ffb434ecefa087339b59e97d30809eca9b739f83f1a89"
     },
     {
       "id": "task_method_20_result_matrix_json",
       "surface": "website_hf",
       "shows": "Machine-readable 9-method by 20-task matrix where every method has 20 records and scoreless cells carry unsupported/not-evaluated reasons.",
       "exists": true,
+      "bytes": 129687,
+      "sha256": "e5d3fa22013fedf350907746f775cc4a1ca3bb3f816b40ca9467d51cf16925f8"
     },
     {
       "id": "task_method_20_result_matrix",
       "surface": "repo_hf",
       "shows": "Reader-facing table that separates 20 records per method from numeric scored axes, documented raw128 proxy scores, unsupported metadata targets, and model targets not evaluated in verified packages.",
       "exists": true,
+      "bytes": 4144,
+      "sha256": "dac2828ba0286bc35290a61b6d02dbd75f0b3acb8d47a73cfa7f072d7fa209c1"
     },
     {
       "id": "task_method_20_gap_audit_json",
       "surface": "website_hf",
       "shows": "Machine-readable 180-record gap ledger with numeric scores, scoreless cells, explicit status reasons, and next evidence needed before new scores can be published.",
       "exists": true,
+      "bytes": 52153,
+      "sha256": "e47ac5d2ac8216f2b46b5fb868275c779226dce8089a8c025dd26571cb5758d3"
     },
     {
       "id": "task_method_20_gap_audit",
       "surface": "repo_hf",
       "shows": "Reader-facing ledger that lists every scoreless method-task cell and the concrete target or model-output evidence required before it can become numeric.",
       "exists": true,
+      "bytes": 14812,
+      "sha256": "d2f0228497fa834c7f097e1fe74e2210b85d0a01f7841356e67dc79929a74413"
     },
     {
       "id": "unified_task_model_radar_chart",
       "surface": "website_hf",
       "shows": "Compares minimal and neural MLP baselines across all 20 tasks, with Qwen3/Cosmos task-aligned model overlays.",
       "exists": true,
+      "bytes": 50618,
+      "sha256": "29ede875ef96c76a8aa7ec6e9883457be611fac8ef967b825041b33fe1d86863"
     },
     {
       "id": "single_episode_task_model_radar_chart",
       "surface": "website_hf",
       "shows": "Separates the selected 128-episode methods: raw-feature simple/NN as complete 20/20 scored polygons and metadata/Qwen/Cosmos as task-aligned overlays.",
       "exists": true,
+      "bytes": 44602,
+      "sha256": "9a2fd542502cb26f093097d9ace238f8cf3b619e0abdec5bf2870c5271fb9ed5"
     },
     {
       "id": "unified_task_model_radar_builder",
       "shows": "Machine-readable release-check summary for validators, mirrors, and public project surfaces.",
       "exists": true,
       "bytes": 8100,
+      "sha256": "0ccb122c1425ef617e7a175ff38cdda9977e737879e609f77fcec2684f4057d4"
     },
     {
       "id": "public_surface_qa",
       "volatile": true,
       "shows": "Confirms public bundles exclude raw data, caches, heavy archives, and credential text.",
       "exists": true,
+      "bytes": 9526,
       "hash_policy": "existence_and_size_only"
     },
     {

docs/data/episode128_task_model_radar.json CHANGED Viewed

@@ -1,12 +1,12 @@
 {
   "title": "128-Episode 20-Task Radar",
   "status": "pass",
-  "generated_at_utc": "2026-06-18T09:06:25+00:00",
   "description": "Selected 128-episode metadata/raw baselines plus verified Qwen3/Cosmos branches. Every method has 20 records; numeric scores appear only where the public artifact produced that task target.",
   "task_count": 20,
   "method_count": 7,
   "method_task_record_count": 140,
-  "scored_method_task_count": 80,
   "normalization_policy": {
     "higher_is_better": "bounded metrics are plotted directly on 0-1 axes after clipping to [0, 1]",
     "lower_is_better": "lower-error metrics are converted to best_observed_value / raw_value within the same task",
@@ -127,17 +127,17 @@
       "method_detail": "Verified held-out Qwen3-Omni v6 LoRA metrics, plus task 16 and any completed private-GPU future-task probes scored from task-specific JSON.",
       "plotted_as": "colored point overlay",
       "result_record_count": 20,
-      "scored_task_count": 14,
-      "covered_task_count": 14,
       "proxy_scored_task_count": 0,
-      "scoreless_task_count": 6,
       "unsupported_task_count": 0,
-      "not_evaluated_task_count": 6,
       "status_counts": {
-        "not_evaluated_in_verified_package": 6,
-        "scored": 14
       },
-      "coverage_fraction": 0.7,
       "result_record_fraction": 1.0
     },
     {
@@ -975,15 +975,15 @@
           "status_label": "scored"
         },
         "qwen3_omni_v6_lora": {
-          "raw": null,
-          "metric_key": "mrr",
-          "source": null,
           "scope": "multi_episode_128_partial_model_overlay",
-          "status": "not_evaluated_in_verified_package",
-          "reason": "the verified public model package did not ask this branch to emit that task target; a new task-specific evaluation package is required for a numeric score",
-          "normalized_score": null,
-          "raw_text": "n/a",
-          "status_label": "not evaluated"
         },
         "cosmos3_super_reasoner": {
           "raw": null,
@@ -3098,17 +3098,17 @@
       "task_label": "Cross-Modal Retrieval",
       "series_id": "qwen3_omni_v6_lora",
       "method": "Qwen3-Omni v6 LoRA",
-      "status": "not_evaluated_in_verified_package",
-      "status_label": "not evaluated",
-      "scored": false,
       "proxy_scored": false,
-      "raw": null,
-      "raw_text": "n/a",
-      "normalized_score": null,
-      "metric_key": "mrr",
-      "source": null,
       "scope": "multi_episode_128_partial_model_overlay",
-      "reason": "the verified public model package did not ask this branch to emit that task target; a new task-specific evaluation package is required for a numeric score"
     },
     {
       "task_number": 9,

 {
   "title": "128-Episode 20-Task Radar",
   "status": "pass",
+  "generated_at_utc": "2026-06-18T10:04:17+00:00",
   "description": "Selected 128-episode metadata/raw baselines plus verified Qwen3/Cosmos branches. Every method has 20 records; numeric scores appear only where the public artifact produced that task target.",
   "task_count": 20,
   "method_count": 7,
   "method_task_record_count": 140,
+  "scored_method_task_count": 81,
   "normalization_policy": {
     "higher_is_better": "bounded metrics are plotted directly on 0-1 axes after clipping to [0, 1]",
     "lower_is_better": "lower-error metrics are converted to best_observed_value / raw_value within the same task",
       "method_detail": "Verified held-out Qwen3-Omni v6 LoRA metrics, plus task 16 and any completed private-GPU future-task probes scored from task-specific JSON.",
       "plotted_as": "colored point overlay",
       "result_record_count": 20,
+      "scored_task_count": 15,
+      "covered_task_count": 15,
       "proxy_scored_task_count": 0,
+      "scoreless_task_count": 5,
       "unsupported_task_count": 0,
+      "not_evaluated_task_count": 5,
       "status_counts": {
+        "not_evaluated_in_verified_package": 5,
+        "scored": 15
       },
+      "coverage_fraction": 0.75,
       "result_record_fraction": 1.0
     },
     {
           "status_label": "scored"
         },
         "qwen3_omni_v6_lora": {
+          "raw": 0.5080191798941732,
+          "metric_key": "cross_modal_retrieval_mrr",
+          "source": "results/omni_finetune/xperience10m_qwen3_omni_v6_cross_modal_retrieval_probe_a100_20260618T000000Z/cross_modal_retrieval/metrics.json",
           "scope": "multi_episode_128_partial_model_overlay",
+          "status": "scored",
+          "reason": null,
+          "normalized_score": 0.5080191798941732,
+          "raw_text": "0.5080",
+          "status_label": "scored"
         },
         "cosmos3_super_reasoner": {
           "raw": null,
       "task_label": "Cross-Modal Retrieval",
       "series_id": "qwen3_omni_v6_lora",
       "method": "Qwen3-Omni v6 LoRA",
+      "status": "scored",
+      "status_label": "scored",
+      "scored": true,
       "proxy_scored": false,
+      "raw": 0.5080191798941732,
+      "raw_text": "0.5080",
+      "normalized_score": 0.5080191798941732,
+      "metric_key": "cross_modal_retrieval_mrr",
+      "source": "results/omni_finetune/xperience10m_qwen3_omni_v6_cross_modal_retrieval_probe_a100_20260618T000000Z/cross_modal_retrieval/metrics.json",
       "scope": "multi_episode_128_partial_model_overlay",
+      "reason": null
     },
     {
       "task_number": 9,

docs/data/mirror_parity.json CHANGED Viewed

@@ -1,9 +1,9 @@
 {
   "status": "pass",
-  "generated_at_utc": "2026-06-18T09:30:32+00:00",
   "hf_root": "hf_publish",
   "summary": {
-    "group_count": 649,
     "failure_count": 0,
     "failures_by_surface": {}
   },
@@ -139,44 +139,44 @@
         "path": "repo:docs/data/artifact_index.json",
         "exists": true,
         "bytes": 116109,
-        "sha256": "5612f2381bcca2a21d585efa3d98d8017a799c164057cb5c03e8b9ed1080423f"
       },
       "mirrors": {
         "hf_space": {
           "path": "hf_space:data/artifact_index.json",
           "exists": true,
           "bytes": 116109,
-          "sha256": "5612f2381bcca2a21d585efa3d98d8017a799c164057cb5c03e8b9ed1080423f"
         },
         "hf_artifacts_data": {
           "path": "hf_artifacts:data/artifact_index.json",
           "exists": true,
           "bytes": 116109,
-          "sha256": "5612f2381bcca2a21d585efa3d98d8017a799c164057cb5c03e8b9ed1080423f"
         },
         "hf_artifacts": {
           "path": "hf_artifacts:docs/data/artifact_index.json",
           "exists": true,
           "bytes": 116109,
-          "sha256": "5612f2381bcca2a21d585efa3d98d8017a799c164057cb5c03e8b9ed1080423f"
         },
         "hf_model_data": {
           "path": "hf_model:data/artifact_index.json",
           "exists": true,
           "bytes": 116109,
-          "sha256": "5612f2381bcca2a21d585efa3d98d8017a799c164057cb5c03e8b9ed1080423f"
         },
         "hf_model_docs_data": {
           "path": "hf_model:docs/data/artifact_index.json",
           "exists": true,
           "bytes": 116109,
-          "sha256": "5612f2381bcca2a21d585efa3d98d8017a799c164057cb5c03e8b9ed1080423f"
         },
         "hf_model": {
           "path": "hf_model:metrics/artifact_index.json",
           "exists": true,
           "bytes": 116109,
-          "sha256": "5612f2381bcca2a21d585efa3d98d8017a799c164057cb5c03e8b9ed1080423f"
         }
       },
       "failures": []
@@ -335,44 +335,44 @@
         "path": "repo:docs/data/figure_index.json",
         "exists": true,
         "bytes": 19441,
-        "sha256": "7f641c6c5a595de09d291f17e4e2aad06a3cee73b6c64608220bf69996f0e581"
       },
       "mirrors": {
         "hf_space": {
           "path": "hf_space:data/figure_index.json",
           "exists": true,
           "bytes": 19441,
-          "sha256": "7f641c6c5a595de09d291f17e4e2aad06a3cee73b6c64608220bf69996f0e581"
         },
         "hf_artifacts_data": {
           "path": "hf_artifacts:data/figure_index.json",
           "exists": true,
           "bytes": 19441,
-          "sha256": "7f641c6c5a595de09d291f17e4e2aad06a3cee73b6c64608220bf69996f0e581"
         },
         "hf_artifacts": {
           "path": "hf_artifacts:docs/data/figure_index.json",
           "exists": true,
           "bytes": 19441,
-          "sha256": "7f641c6c5a595de09d291f17e4e2aad06a3cee73b6c64608220bf69996f0e581"
         },
         "hf_model_data": {
           "path": "hf_model:data/figure_index.json",
           "exists": true,
           "bytes": 19441,
-          "sha256": "7f641c6c5a595de09d291f17e4e2aad06a3cee73b6c64608220bf69996f0e581"
         },
         "hf_model_docs_data": {
           "path": "hf_model:docs/data/figure_index.json",
           "exists": true,
           "bytes": 19441,
-          "sha256": "7f641c6c5a595de09d291f17e4e2aad06a3cee73b6c64608220bf69996f0e581"
         },
         "hf_model": {
           "path": "hf_model:metrics/figure_index.json",
           "exists": true,
           "bytes": 19441,
-          "sha256": "7f641c6c5a595de09d291f17e4e2aad06a3cee73b6c64608220bf69996f0e581"
         }
       },
       "failures": []
@@ -922,45 +922,45 @@
       "local": {
         "path": "repo:docs/data/publication_audit.json",
         "exists": true,
-        "bytes": 9526,
-        "sha256": "25759aa29d95fa065a9fe3ec74fb3781e8d5858ac6ca2553c7b2d29c48bbb93d"
       },
       "mirrors": {
         "hf_space": {
           "path": "hf_space:data/publication_audit.json",
           "exists": true,
-          "bytes": 9526,
-          "sha256": "25759aa29d95fa065a9fe3ec74fb3781e8d5858ac6ca2553c7b2d29c48bbb93d"
         },
         "hf_artifacts_data": {
           "path": "hf_artifacts:data/publication_audit.json",
           "exists": true,
-          "bytes": 9526,
-          "sha256": "25759aa29d95fa065a9fe3ec74fb3781e8d5858ac6ca2553c7b2d29c48bbb93d"
         },
         "hf_artifacts": {
           "path": "hf_artifacts:docs/data/publication_audit.json",
           "exists": true,
-          "bytes": 9526,
-          "sha256": "25759aa29d95fa065a9fe3ec74fb3781e8d5858ac6ca2553c7b2d29c48bbb93d"
         },
         "hf_model_data": {
           "path": "hf_model:data/publication_audit.json",
           "exists": true,
-          "bytes": 9526,
-          "sha256": "25759aa29d95fa065a9fe3ec74fb3781e8d5858ac6ca2553c7b2d29c48bbb93d"
         },
         "hf_model_docs_data": {
           "path": "hf_model:docs/data/publication_audit.json",
           "exists": true,
-          "bytes": 9526,
-          "sha256": "25759aa29d95fa065a9fe3ec74fb3781e8d5858ac6ca2553c7b2d29c48bbb93d"
         },
         "hf_model": {
           "path": "hf_model:metrics/publication_audit.json",
           "exists": true,
-          "bytes": 9526,
-          "sha256": "25759aa29d95fa065a9fe3ec74fb3781e8d5858ac6ca2553c7b2d29c48bbb93d"
         }
       },
       "failures": []
@@ -972,44 +972,44 @@
         "path": "repo:docs/data/public_surface_qa.json",
         "exists": true,
         "bytes": 7126,
-        "sha256": "97f7e2df04f2b88ce9f2957037da201619e97220d8a72cee572ab4d1cecedb72"
       },
       "mirrors": {
         "hf_space": {
           "path": "hf_space:data/public_surface_qa.json",
           "exists": true,
           "bytes": 7126,
-          "sha256": "97f7e2df04f2b88ce9f2957037da201619e97220d8a72cee572ab4d1cecedb72"
         },
         "hf_artifacts_data": {
           "path": "hf_artifacts:data/public_surface_qa.json",
           "exists": true,
           "bytes": 7126,
-          "sha256": "97f7e2df04f2b88ce9f2957037da201619e97220d8a72cee572ab4d1cecedb72"
         },
         "hf_artifacts": {
           "path": "hf_artifacts:docs/data/public_surface_qa.json",
           "exists": true,
           "bytes": 7126,
-          "sha256": "97f7e2df04f2b88ce9f2957037da201619e97220d8a72cee572ab4d1cecedb72"
         },
         "hf_model_data": {
           "path": "hf_model:data/public_surface_qa.json",
           "exists": true,
           "bytes": 7126,
-          "sha256": "97f7e2df04f2b88ce9f2957037da201619e97220d8a72cee572ab4d1cecedb72"
         },
         "hf_model_docs_data": {
           "path": "hf_model:docs/data/public_surface_qa.json",
           "exists": true,
           "bytes": 7126,
-          "sha256": "97f7e2df04f2b88ce9f2957037da201619e97220d8a72cee572ab4d1cecedb72"
         },
         "hf_model": {
           "path": "hf_model:metrics/public_surface_qa.json",
           "exists": true,
           "bytes": 7126,
-          "sha256": "97f7e2df04f2b88ce9f2957037da201619e97220d8a72cee572ab4d1cecedb72"
         }
       },
       "failures": []
@@ -1119,44 +1119,44 @@
         "path": "repo:docs/data/quality_gates.json",
         "exists": true,
         "bytes": 8100,
-        "sha256": "b5e7b11d54cc3234e57e9272406a0ffca1e5bb4ad42a45b30d9493ed8d82b4bf"
       },
       "mirrors": {
         "hf_space": {
           "path": "hf_space:data/quality_gates.json",
           "exists": true,
           "bytes": 8100,
-          "sha256": "b5e7b11d54cc3234e57e9272406a0ffca1e5bb4ad42a45b30d9493ed8d82b4bf"
         },
         "hf_artifacts_data": {
           "path": "hf_artifacts:data/quality_gates.json",
           "exists": true,
           "bytes": 8100,
-          "sha256": "b5e7b11d54cc3234e57e9272406a0ffca1e5bb4ad42a45b30d9493ed8d82b4bf"
         },
         "hf_artifacts": {
           "path": "hf_artifacts:docs/data/quality_gates.json",
           "exists": true,
           "bytes": 8100,
-          "sha256": "b5e7b11d54cc3234e57e9272406a0ffca1e5bb4ad42a45b30d9493ed8d82b4bf"
         },
         "hf_model_data": {
           "path": "hf_model:data/quality_gates.json",
           "exists": true,
           "bytes": 8100,
-          "sha256": "b5e7b11d54cc3234e57e9272406a0ffca1e5bb4ad42a45b30d9493ed8d82b4bf"
         },
         "hf_model_docs_data": {
           "path": "hf_model:docs/data/quality_gates.json",
           "exists": true,
           "bytes": 8100,
-          "sha256": "b5e7b11d54cc3234e57e9272406a0ffca1e5bb4ad42a45b30d9493ed8d82b4bf"
         },
         "hf_model": {
           "path": "hf_model:metrics/quality_gates.json",
           "exists": true,
           "bytes": 8100,
-          "sha256": "b5e7b11d54cc3234e57e9272406a0ffca1e5bb4ad42a45b30d9493ed8d82b4bf"
         }
       },
       "failures": []
@@ -1560,44 +1560,44 @@
         "path": "repo:docs/data/scope_claims_audit.json",
         "exists": true,
         "bytes": 21630,
-        "sha256": "6df6428701f8becd539f3bbdd80caabd69a0c51b29a3a78f08a2cf64523e8593"
       },
       "mirrors": {
         "hf_space": {
           "path": "hf_space:data/scope_claims_audit.json",
           "exists": true,
           "bytes": 21630,
-          "sha256": "6df6428701f8becd539f3bbdd80caabd69a0c51b29a3a78f08a2cf64523e8593"
         },
         "hf_artifacts_data": {
           "path": "hf_artifacts:data/scope_claims_audit.json",
           "exists": true,
           "bytes": 21630,
-          "sha256": "6df6428701f8becd539f3bbdd80caabd69a0c51b29a3a78f08a2cf64523e8593"
         },
         "hf_artifacts": {
           "path": "hf_artifacts:docs/data/scope_claims_audit.json",
           "exists": true,
           "bytes": 21630,
-          "sha256": "6df6428701f8becd539f3bbdd80caabd69a0c51b29a3a78f08a2cf64523e8593"
         },
         "hf_model_data": {
           "path": "hf_model:data/scope_claims_audit.json",
           "exists": true,
           "bytes": 21630,
-          "sha256": "6df6428701f8becd539f3bbdd80caabd69a0c51b29a3a78f08a2cf64523e8593"
         },
         "hf_model_docs_data": {
           "path": "hf_model:docs/data/scope_claims_audit.json",
           "exists": true,
           "bytes": 21630,
-          "sha256": "6df6428701f8becd539f3bbdd80caabd69a0c51b29a3a78f08a2cf64523e8593"
         },
         "hf_model": {
           "path": "hf_model:metrics/scope_claims_audit.json",
           "exists": true,
           "bytes": 21630,
-          "sha256": "6df6428701f8becd539f3bbdd80caabd69a0c51b29a3a78f08a2cf64523e8593"
         }
       },
       "failures": []
@@ -1658,44 +1658,44 @@
         "path": "repo:docs/data/source_alignment_audit.json",
         "exists": true,
         "bytes": 4432,
-        "sha256": "499e62359f6db0afa32c1160a2c4ca90da511c1035efaac4e77943c4905751a7"
       },
       "mirrors": {
         "hf_space": {
           "path": "hf_space:data/source_alignment_audit.json",
           "exists": true,
           "bytes": 4432,
-          "sha256": "499e62359f6db0afa32c1160a2c4ca90da511c1035efaac4e77943c4905751a7"
         },
         "hf_artifacts_data": {
           "path": "hf_artifacts:data/source_alignment_audit.json",
           "exists": true,
           "bytes": 4432,
-          "sha256": "499e62359f6db0afa32c1160a2c4ca90da511c1035efaac4e77943c4905751a7"
         },
         "hf_artifacts": {
           "path": "hf_artifacts:docs/data/source_alignment_audit.json",
           "exists": true,
           "bytes": 4432,
-          "sha256": "499e62359f6db0afa32c1160a2c4ca90da511c1035efaac4e77943c4905751a7"
         },
         "hf_model_data": {
           "path": "hf_model:data/source_alignment_audit.json",
           "exists": true,
           "bytes": 4432,
-          "sha256": "499e62359f6db0afa32c1160a2c4ca90da511c1035efaac4e77943c4905751a7"
         },
         "hf_model_docs_data": {
           "path": "hf_model:docs/data/source_alignment_audit.json",
           "exists": true,
           "bytes": 4432,
-          "sha256": "499e62359f6db0afa32c1160a2c4ca90da511c1035efaac4e77943c4905751a7"
         },
         "hf_model": {
           "path": "hf_model:metrics/source_alignment_audit.json",
           "exists": true,
           "bytes": 4432,
-          "sha256": "499e62359f6db0afa32c1160a2c4ca90da511c1035efaac4e77943c4905751a7"
         }
       },
       "failures": []
@@ -1756,44 +1756,44 @@
         "path": "repo:docs/data/single_episode_task_model_radar.json",
         "exists": true,
         "bytes": 50973,
-        "sha256": "01d524bca7b7a827134ac00af76659745f6c2127096064078f99c3db151cc7e0"
       },
       "mirrors": {
         "hf_space": {
           "path": "hf_space:data/single_episode_task_model_radar.json",
           "exists": true,
           "bytes": 50973,
-          "sha256": "01d524bca7b7a827134ac00af76659745f6c2127096064078f99c3db151cc7e0"
         },
         "hf_artifacts_data": {
           "path": "hf_artifacts:data/single_episode_task_model_radar.json",
           "exists": true,
           "bytes": 50973,
-          "sha256": "01d524bca7b7a827134ac00af76659745f6c2127096064078f99c3db151cc7e0"
         },
         "hf_artifacts": {
           "path": "hf_artifacts:docs/data/single_episode_task_model_radar.json",
           "exists": true,
           "bytes": 50973,
-          "sha256": "01d524bca7b7a827134ac00af76659745f6c2127096064078f99c3db151cc7e0"
         },
         "hf_model_data": {
           "path": "hf_model:data/single_episode_task_model_radar.json",
           "exists": true,
           "bytes": 50973,
-          "sha256": "01d524bca7b7a827134ac00af76659745f6c2127096064078f99c3db151cc7e0"
         },
         "hf_model_docs_data": {
           "path": "hf_model:docs/data/single_episode_task_model_radar.json",
           "exists": true,
           "bytes": 50973,
-          "sha256": "01d524bca7b7a827134ac00af76659745f6c2127096064078f99c3db151cc7e0"
         },
         "hf_model": {
           "path": "hf_model:metrics/single_episode_task_model_radar.json",
           "exists": true,
           "bytes": 50973,
-          "sha256": "01d524bca7b7a827134ac00af76659745f6c2127096064078f99c3db151cc7e0"
         }
       },
       "failures": []
@@ -1804,45 +1804,45 @@
       "local": {
         "path": "repo:docs/data/episode128_task_model_radar.json",
         "exists": true,
-        "bytes": 187275,
-        "sha256": "e006cb7f6c0c8bf7258a42206ec095b4ad2622c4bd7b9f67275d8a9cae2105a5"
       },
       "mirrors": {
         "hf_space": {
           "path": "hf_space:data/episode128_task_model_radar.json",
           "exists": true,
-          "bytes": 187275,
-          "sha256": "e006cb7f6c0c8bf7258a42206ec095b4ad2622c4bd7b9f67275d8a9cae2105a5"
         },
         "hf_artifacts_data": {
           "path": "hf_artifacts:data/episode128_task_model_radar.json",
           "exists": true,
-          "bytes": 187275,
-          "sha256": "e006cb7f6c0c8bf7258a42206ec095b4ad2622c4bd7b9f67275d8a9cae2105a5"
         },
         "hf_artifacts": {
           "path": "hf_artifacts:docs/data/episode128_task_model_radar.json",
           "exists": true,
-          "bytes": 187275,
-          "sha256": "e006cb7f6c0c8bf7258a42206ec095b4ad2622c4bd7b9f67275d8a9cae2105a5"
         },
         "hf_model_data": {
           "path": "hf_model:data/episode128_task_model_radar.json",
           "exists": true,
-          "bytes": 187275,
-          "sha256": "e006cb7f6c0c8bf7258a42206ec095b4ad2622c4bd7b9f67275d8a9cae2105a5"
         },
         "hf_model_docs_data": {
           "path": "hf_model:docs/data/episode128_task_model_radar.json",
           "exists": true,
-          "bytes": 187275,
-          "sha256": "e006cb7f6c0c8bf7258a42206ec095b4ad2622c4bd7b9f67275d8a9cae2105a5"
         },
         "hf_model": {
           "path": "hf_model:metrics/episode128_task_model_radar.json",
           "exists": true,
-          "bytes": 187275,
-          "sha256": "e006cb7f6c0c8bf7258a42206ec095b4ad2622c4bd7b9f67275d8a9cae2105a5"
         }
       },
       "failures": []
@@ -2001,44 +2001,44 @@
         "path": "repo:docs/data/task_surface_integrity.json",
         "exists": true,
         "bytes": 45779,
-        "sha256": "ab9f1f8b5eb785d72a3e554c041d802cc551787a710af417d1cc04f60c42c6c2"
       },
       "mirrors": {
         "hf_space": {
           "path": "hf_space:data/task_surface_integrity.json",
           "exists": true,
           "bytes": 45779,
-          "sha256": "ab9f1f8b5eb785d72a3e554c041d802cc551787a710af417d1cc04f60c42c6c2"
         },
         "hf_artifacts_data": {
           "path": "hf_artifacts:data/task_surface_integrity.json",
           "exists": true,
           "bytes": 45779,
-          "sha256": "ab9f1f8b5eb785d72a3e554c041d802cc551787a710af417d1cc04f60c42c6c2"
         },
         "hf_artifacts": {
           "path": "hf_artifacts:docs/data/task_surface_integrity.json",
           "exists": true,
           "bytes": 45779,
-          "sha256": "ab9f1f8b5eb785d72a3e554c041d802cc551787a710af417d1cc04f60c42c6c2"
         },
         "hf_model_data": {
           "path": "hf_model:data/task_surface_integrity.json",
           "exists": true,
           "bytes": 45779,
-          "sha256": "ab9f1f8b5eb785d72a3e554c041d802cc551787a710af417d1cc04f60c42c6c2"
         },
         "hf_model_docs_data": {
           "path": "hf_model:docs/data/task_surface_integrity.json",
           "exists": true,
           "bytes": 45779,
-          "sha256": "ab9f1f8b5eb785d72a3e554c041d802cc551787a710af417d1cc04f60c42c6c2"
         },
         "hf_model": {
           "path": "hf_model:metrics/task_surface_integrity.json",
           "exists": true,
           "bytes": 45779,
-          "sha256": "ab9f1f8b5eb785d72a3e554c041d802cc551787a710af417d1cc04f60c42c6c2"
         }
       },
       "failures": []
@@ -2098,45 +2098,45 @@
       "local": {
         "path": "repo:docs/data/task_method_20_result_matrix.json",
         "exists": true,
-        "bytes": 129689,
-        "sha256": "d633cbc900b04df4afef67a75a9d17d79c9da2942a43ab0d5d31dcf270af2c94"
       },
       "mirrors": {
         "hf_space": {
           "path": "hf_space:data/task_method_20_result_matrix.json",
           "exists": true,
-          "bytes": 129689,
-          "sha256": "d633cbc900b04df4afef67a75a9d17d79c9da2942a43ab0d5d31dcf270af2c94"
         },
         "hf_artifacts_data": {
           "path": "hf_artifacts:data/task_method_20_result_matrix.json",
           "exists": true,
-          "bytes": 129689,
-          "sha256": "d633cbc900b04df4afef67a75a9d17d79c9da2942a43ab0d5d31dcf270af2c94"
         },
         "hf_artifacts": {
           "path": "hf_artifacts:docs/data/task_method_20_result_matrix.json",
           "exists": true,
-          "bytes": 129689,
-          "sha256": "d633cbc900b04df4afef67a75a9d17d79c9da2942a43ab0d5d31dcf270af2c94"
         },
         "hf_model_data": {
           "path": "hf_model:data/task_method_20_result_matrix.json",
           "exists": true,
-          "bytes": 129689,
-          "sha256": "d633cbc900b04df4afef67a75a9d17d79c9da2942a43ab0d5d31dcf270af2c94"
         },
         "hf_model_docs_data": {
           "path": "hf_model:docs/data/task_method_20_result_matrix.json",
           "exists": true,
-          "bytes": 129689,
-          "sha256": "d633cbc900b04df4afef67a75a9d17d79c9da2942a43ab0d5d31dcf270af2c94"
         },
         "hf_model": {
           "path": "hf_model:metrics/task_method_20_result_matrix.json",
           "exists": true,
-          "bytes": 129689,
-          "sha256": "d633cbc900b04df4afef67a75a9d17d79c9da2942a43ab0d5d31dcf270af2c94"
         }
       },
       "failures": []
@@ -2147,45 +2147,45 @@
       "local": {
         "path": "repo:docs/data/task_method_20_gap_audit.json",
         "exists": true,
-        "bytes": 52867,
-        "sha256": "255ba3324994ee1848a99f6bc08b74b447a63a18638d43b93017dbb591b19c6d"
       },
       "mirrors": {
         "hf_space": {
           "path": "hf_space:data/task_method_20_gap_audit.json",
           "exists": true,
-          "bytes": 52867,
-          "sha256": "255ba3324994ee1848a99f6bc08b74b447a63a18638d43b93017dbb591b19c6d"
         },
         "hf_artifacts_data": {
           "path": "hf_artifacts:data/task_method_20_gap_audit.json",
           "exists": true,
-          "bytes": 52867,
-          "sha256": "255ba3324994ee1848a99f6bc08b74b447a63a18638d43b93017dbb591b19c6d"
         },
         "hf_artifacts": {
           "path": "hf_artifacts:docs/data/task_method_20_gap_audit.json",
           "exists": true,
-          "bytes": 52867,
-          "sha256": "255ba3324994ee1848a99f6bc08b74b447a63a18638d43b93017dbb591b19c6d"
         },
         "hf_model_data": {
           "path": "hf_model:data/task_method_20_gap_audit.json",
           "exists": true,
-          "bytes": 52867,
-          "sha256": "255ba3324994ee1848a99f6bc08b74b447a63a18638d43b93017dbb591b19c6d"
         },
         "hf_model_docs_data": {
           "path": "hf_model:docs/data/task_method_20_gap_audit.json",
           "exists": true,
-          "bytes": 52867,
-          "sha256": "255ba3324994ee1848a99f6bc08b74b447a63a18638d43b93017dbb591b19c6d"
         },
         "hf_model": {
           "path": "hf_model:metrics/task_method_20_gap_audit.json",
           "exists": true,
-          "bytes": 52867,
-          "sha256": "255ba3324994ee1848a99f6bc08b74b447a63a18638d43b93017dbb591b19c6d"
         }
       },
       "failures": []
@@ -2245,45 +2245,45 @@
       "local": {
         "path": "repo:docs/data/unified_task_model_radar.json",
         "exists": true,
-        "bytes": 231127,
-        "sha256": "3bcabe4b7182b66292c012f26401d753f581d9feb3d0adb312a5115933f34767"
       },
       "mirrors": {
         "hf_space": {
           "path": "hf_space:data/unified_task_model_radar.json",
           "exists": true,
-          "bytes": 231127,
-          "sha256": "3bcabe4b7182b66292c012f26401d753f581d9feb3d0adb312a5115933f34767"
         },
         "hf_artifacts_data": {
           "path": "hf_artifacts:data/unified_task_model_radar.json",
           "exists": true,
-          "bytes": 231127,
-          "sha256": "3bcabe4b7182b66292c012f26401d753f581d9feb3d0adb312a5115933f34767"
         },
         "hf_artifacts": {
           "path": "hf_artifacts:docs/data/unified_task_model_radar.json",
           "exists": true,
-          "bytes": 231127,
-          "sha256": "3bcabe4b7182b66292c012f26401d753f581d9feb3d0adb312a5115933f34767"
         },
         "hf_model_data": {
           "path": "hf_model:data/unified_task_model_radar.json",
           "exists": true,
-          "bytes": 231127,
-          "sha256": "3bcabe4b7182b66292c012f26401d753f581d9feb3d0adb312a5115933f34767"
         },
         "hf_model_docs_data": {
           "path": "hf_model:docs/data/unified_task_model_radar.json",
           "exists": true,
-          "bytes": 231127,
-          "sha256": "3bcabe4b7182b66292c012f26401d753f581d9feb3d0adb312a5115933f34767"
         },
         "hf_model": {
           "path": "hf_model:metrics/unified_task_model_radar.json",
           "exists": true,
-          "bytes": 231127,
-          "sha256": "3bcabe4b7182b66292c012f26401d753f581d9feb3d0adb312a5115933f34767"
         }
       },
       "failures": []
@@ -2295,44 +2295,44 @@
         "path": "repo:docs/data/website_integrity.json",
         "exists": true,
         "bytes": 20021,
-        "sha256": "1efe3b5b4a3d0a148df2dea58001a6d6aa9ea1d8c176fe647c056d7cbd676797"
       },
       "mirrors": {
         "hf_space": {
           "path": "hf_space:data/website_integrity.json",
           "exists": true,
           "bytes": 20021,
-          "sha256": "1efe3b5b4a3d0a148df2dea58001a6d6aa9ea1d8c176fe647c056d7cbd676797"
         },
         "hf_artifacts_data": {
           "path": "hf_artifacts:data/website_integrity.json",
           "exists": true,
           "bytes": 20021,
-          "sha256": "1efe3b5b4a3d0a148df2dea58001a6d6aa9ea1d8c176fe647c056d7cbd676797"
         },
         "hf_artifacts": {
           "path": "hf_artifacts:docs/data/website_integrity.json",
           "exists": true,
           "bytes": 20021,
-          "sha256": "1efe3b5b4a3d0a148df2dea58001a6d6aa9ea1d8c176fe647c056d7cbd676797"
         },
         "hf_model_data": {
           "path": "hf_model:data/website_integrity.json",
           "exists": true,
           "bytes": 20021,
-          "sha256": "1efe3b5b4a3d0a148df2dea58001a6d6aa9ea1d8c176fe647c056d7cbd676797"
         },
         "hf_model_docs_data": {
           "path": "hf_model:docs/data/website_integrity.json",
           "exists": true,
           "bytes": 20021,
-          "sha256": "1efe3b5b4a3d0a148df2dea58001a6d6aa9ea1d8c176fe647c056d7cbd676797"
         },
         "hf_model": {
           "path": "hf_model:metrics/website_integrity.json",
           "exists": true,
           "bytes": 20021,
-          "sha256": "1efe3b5b4a3d0a148df2dea58001a6d6aa9ea1d8c176fe647c056d7cbd676797"
         }
       },
       "failures": []
@@ -2515,33 +2515,33 @@
       "local": {
         "path": "repo:docs/assets/charts/episode128_task_model_radar.svg",
         "exists": true,
-        "bytes": 44490,
-        "sha256": "537c0dc2f1173bc40aaa216cbf760aeea30c9325ddd5c08e1f16e476d4c01bdd"
       },
       "mirrors": {
         "hf_space": {
           "path": "hf_space:assets/charts/episode128_task_model_radar.svg",
           "exists": true,
-          "bytes": 44490,
-          "sha256": "537c0dc2f1173bc40aaa216cbf760aeea30c9325ddd5c08e1f16e476d4c01bdd"
         },
         "hf_artifacts_docs": {
           "path": "hf_artifacts:docs/assets/charts/episode128_task_model_radar.svg",
           "exists": true,
-          "bytes": 44490,
-          "sha256": "537c0dc2f1173bc40aaa216cbf760aeea30c9325ddd5c08e1f16e476d4c01bdd"
         },
         "hf_artifacts_card": {
           "path": "hf_artifacts:assets/charts/episode128_task_model_radar.svg",
           "exists": true,
-          "bytes": 44490,
-          "sha256": "537c0dc2f1173bc40aaa216cbf760aeea30c9325ddd5c08e1f16e476d4c01bdd"
         },
         "hf_model": {
           "path": "hf_model:assets/charts/episode128_task_model_radar.svg",
           "exists": true,
-          "bytes": 44490,
-          "sha256": "537c0dc2f1173bc40aaa216cbf760aeea30c9325ddd5c08e1f16e476d4c01bdd"
         }
       },
       "failures": []
@@ -2589,33 +2589,33 @@
       "local": {
         "path": "repo:docs/assets/charts/unified_task_model_radar.svg",
         "exists": true,
-        "bytes": 50506,
-        "sha256": "890cbddb57e241e4360c96c18a013c98ed56d26711f136babac6e3313751bbfb"
       },
       "mirrors": {
         "hf_space": {
           "path": "hf_space:assets/charts/unified_task_model_radar.svg",
           "exists": true,
-          "bytes": 50506,
-          "sha256": "890cbddb57e241e4360c96c18a013c98ed56d26711f136babac6e3313751bbfb"
         },
         "hf_artifacts_docs": {
           "path": "hf_artifacts:docs/assets/charts/unified_task_model_radar.svg",
           "exists": true,
-          "bytes": 50506,
-          "sha256": "890cbddb57e241e4360c96c18a013c98ed56d26711f136babac6e3313751bbfb"
         },
         "hf_artifacts_card": {
           "path": "hf_artifacts:assets/charts/unified_task_model_radar.svg",
           "exists": true,
-          "bytes": 50506,
-          "sha256": "890cbddb57e241e4360c96c18a013c98ed56d26711f136babac6e3313751bbfb"
         },
         "hf_model": {
           "path": "hf_model:assets/charts/unified_task_model_radar.svg",
           "exists": true,
-          "bytes": 50506,
-          "sha256": "890cbddb57e241e4360c96c18a013c98ed56d26711f136babac6e3313751bbfb"
         }
       },
       "failures": []
@@ -3917,6 +3917,31 @@
       },
       "failures": []
     },
     {
       "name": "scripts/omni/collect_qwen3_v4_release_artifacts.py",
       "status": "pass",
@@ -4973,21 +4998,21 @@
       "local": {
         "path": "repo:scripts/validate_mirror_parity.py",
         "exists": true,
-        "bytes": 28427,
-        "sha256": "a85b031f81f378c6baa2a4201589383f828934f03b74ba300eb0bc803c929801"
       },
       "mirrors": {
         "hf_artifacts": {
           "path": "hf_artifacts:scripts/validate_mirror_parity.py",
           "exists": true,
-          "bytes": 28427,
-          "sha256": "a85b031f81f378c6baa2a4201589383f828934f03b74ba300eb0bc803c929801"
         },
         "hf_model": {
           "path": "hf_model:scripts/validate_mirror_parity.py",
           "exists": true,
-          "bytes": 28427,
-          "sha256": "a85b031f81f378c6baa2a4201589383f828934f03b74ba300eb0bc803c929801"
         }
       },
       "failures": []
@@ -4998,21 +5023,21 @@
       "local": {
         "path": "repo:scripts/validate_publication_package.py",
         "exists": true,
-        "bytes": 19912,
-        "sha256": "efb862566bedc49b0eaa11c9abdeb29abf8d3acd461b772fc79854e24dcb1c18"
       },
       "mirrors": {
         "hf_artifacts": {
           "path": "hf_artifacts:scripts/validate_publication_package.py",
           "exists": true,
-          "bytes": 19912,
-          "sha256": "efb862566bedc49b0eaa11c9abdeb29abf8d3acd461b772fc79854e24dcb1c18"
         },
         "hf_model": {
           "path": "hf_model:scripts/validate_publication_package.py",
           "exists": true,
-          "bytes": 19912,
-          "sha256": "efb862566bedc49b0eaa11c9abdeb29abf8d3acd461b772fc79854e24dcb1c18"
         }
       },
       "failures": []
@@ -20782,27 +20807,27 @@
       "local": {
         "path": "repo:TASK_METHOD_20_GAP_AUDIT.md",
         "exists": true,
-        "bytes": 14981,
-        "sha256": "90f9885e601b2f19af863650fae7821092147ada1d86bb945b08c3cd603197ac"
       },
       "mirrors": {
         "hf_space": {
           "path": "hf_space:TASK_METHOD_20_GAP_AUDIT.md",
           "exists": true,
-          "bytes": 14981,
-          "sha256": "90f9885e601b2f19af863650fae7821092147ada1d86bb945b08c3cd603197ac"
         },
         "hf_artifacts": {
           "path": "hf_artifacts:TASK_METHOD_20_GAP_AUDIT.md",
           "exists": true,
-          "bytes": 14981,
-          "sha256": "90f9885e601b2f19af863650fae7821092147ada1d86bb945b08c3cd603197ac"
         },
         "hf_model": {
           "path": "hf_model:TASK_METHOD_20_GAP_AUDIT.md",
           "exists": true,
-          "bytes": 14981,
-          "sha256": "90f9885e601b2f19af863650fae7821092147ada1d86bb945b08c3cd603197ac"
         }
       },
       "failures": []
@@ -20813,27 +20838,27 @@
       "local": {
         "path": "repo:TASK_METHOD_20_RESULT_MATRIX.md",
         "exists": true,
-        "bytes": 4152,
-        "sha256": "c5ce3d4dc21751dc0b7e371ac0d92790190e306f48b0147d99952646ae2dedb1"
       },
       "mirrors": {
         "hf_space": {
           "path": "hf_space:TASK_METHOD_20_RESULT_MATRIX.md",
           "exists": true,
-          "bytes": 4152,
-          "sha256": "c5ce3d4dc21751dc0b7e371ac0d92790190e306f48b0147d99952646ae2dedb1"
         },
         "hf_artifacts": {
           "path": "hf_artifacts:TASK_METHOD_20_RESULT_MATRIX.md",
           "exists": true,
-          "bytes": 4152,
-          "sha256": "c5ce3d4dc21751dc0b7e371ac0d92790190e306f48b0147d99952646ae2dedb1"
         },
         "hf_model": {
           "path": "hf_model:TASK_METHOD_20_RESULT_MATRIX.md",
           "exists": true,
-          "bytes": 4152,
-          "sha256": "c5ce3d4dc21751dc0b7e371ac0d92790190e306f48b0147d99952646ae2dedb1"
         }
       },
       "failures": []

 {
   "status": "pass",
+  "generated_at_utc": "2026-06-18T10:05:53+00:00",
   "hf_root": "hf_publish",
   "summary": {
+    "group_count": 650,
     "failure_count": 0,
     "failures_by_surface": {}
   },
         "path": "repo:docs/data/artifact_index.json",
         "exists": true,
         "bytes": 116109,
+        "sha256": "b88adcd80deb8cc4b4c3ed08e1a9ee7c2d8cdb21feab8a3494bd2e80e67d1b9a"
       },
       "mirrors": {
         "hf_space": {
           "path": "hf_space:data/artifact_index.json",
           "exists": true,
           "bytes": 116109,
+          "sha256": "b88adcd80deb8cc4b4c3ed08e1a9ee7c2d8cdb21feab8a3494bd2e80e67d1b9a"
         },
         "hf_artifacts_data": {
           "path": "hf_artifacts:data/artifact_index.json",
           "exists": true,
           "bytes": 116109,
+          "sha256": "b88adcd80deb8cc4b4c3ed08e1a9ee7c2d8cdb21feab8a3494bd2e80e67d1b9a"
         },
         "hf_artifacts": {
           "path": "hf_artifacts:docs/data/artifact_index.json",
           "exists": true,
           "bytes": 116109,
+          "sha256": "b88adcd80deb8cc4b4c3ed08e1a9ee7c2d8cdb21feab8a3494bd2e80e67d1b9a"
         },
         "hf_model_data": {
           "path": "hf_model:data/artifact_index.json",
           "exists": true,
           "bytes": 116109,
+          "sha256": "b88adcd80deb8cc4b4c3ed08e1a9ee7c2d8cdb21feab8a3494bd2e80e67d1b9a"
         },
         "hf_model_docs_data": {
           "path": "hf_model:docs/data/artifact_index.json",
           "exists": true,
           "bytes": 116109,
+          "sha256": "b88adcd80deb8cc4b4c3ed08e1a9ee7c2d8cdb21feab8a3494bd2e80e67d1b9a"
         },
         "hf_model": {
           "path": "hf_model:metrics/artifact_index.json",
           "exists": true,
           "bytes": 116109,
+          "sha256": "b88adcd80deb8cc4b4c3ed08e1a9ee7c2d8cdb21feab8a3494bd2e80e67d1b9a"
         }
       },
       "failures": []
         "path": "repo:docs/data/figure_index.json",
         "exists": true,
         "bytes": 19441,
+        "sha256": "ec004dfdba639132e975c65c8a524e45caa246b9d03baa1ea26eca2b288186ff"
       },
       "mirrors": {
         "hf_space": {
           "path": "hf_space:data/figure_index.json",
           "exists": true,
           "bytes": 19441,
+          "sha256": "ec004dfdba639132e975c65c8a524e45caa246b9d03baa1ea26eca2b288186ff"
         },
         "hf_artifacts_data": {
           "path": "hf_artifacts:data/figure_index.json",
           "exists": true,
           "bytes": 19441,
+          "sha256": "ec004dfdba639132e975c65c8a524e45caa246b9d03baa1ea26eca2b288186ff"
         },
         "hf_artifacts": {
           "path": "hf_artifacts:docs/data/figure_index.json",
           "exists": true,
           "bytes": 19441,
+          "sha256": "ec004dfdba639132e975c65c8a524e45caa246b9d03baa1ea26eca2b288186ff"
         },
         "hf_model_data": {
           "path": "hf_model:data/figure_index.json",
           "exists": true,
           "bytes": 19441,
+          "sha256": "ec004dfdba639132e975c65c8a524e45caa246b9d03baa1ea26eca2b288186ff"
         },
         "hf_model_docs_data": {
           "path": "hf_model:docs/data/figure_index.json",
           "exists": true,
           "bytes": 19441,
+          "sha256": "ec004dfdba639132e975c65c8a524e45caa246b9d03baa1ea26eca2b288186ff"
         },
         "hf_model": {
           "path": "hf_model:metrics/figure_index.json",
           "exists": true,
           "bytes": 19441,
+          "sha256": "ec004dfdba639132e975c65c8a524e45caa246b9d03baa1ea26eca2b288186ff"
         }
       },
       "failures": []
       "local": {
         "path": "repo:docs/data/publication_audit.json",
         "exists": true,
+        "bytes": 9598,
+        "sha256": "f1d2bff3ff9bb0be059a23eec635974cdd8208a8670277178050c47e1f8b805a"
       },
       "mirrors": {
         "hf_space": {
           "path": "hf_space:data/publication_audit.json",
           "exists": true,
+          "bytes": 9598,
+          "sha256": "f1d2bff3ff9bb0be059a23eec635974cdd8208a8670277178050c47e1f8b805a"
         },
         "hf_artifacts_data": {
           "path": "hf_artifacts:data/publication_audit.json",
           "exists": true,
+          "bytes": 9598,
+          "sha256": "f1d2bff3ff9bb0be059a23eec635974cdd8208a8670277178050c47e1f8b805a"
         },
         "hf_artifacts": {
           "path": "hf_artifacts:docs/data/publication_audit.json",
           "exists": true,
+          "bytes": 9598,
+          "sha256": "f1d2bff3ff9bb0be059a23eec635974cdd8208a8670277178050c47e1f8b805a"
         },
         "hf_model_data": {
           "path": "hf_model:data/publication_audit.json",
           "exists": true,
+          "bytes": 9598,
+          "sha256": "f1d2bff3ff9bb0be059a23eec635974cdd8208a8670277178050c47e1f8b805a"
         },
         "hf_model_docs_data": {
           "path": "hf_model:docs/data/publication_audit.json",
           "exists": true,
+          "bytes": 9598,
+          "sha256": "f1d2bff3ff9bb0be059a23eec635974cdd8208a8670277178050c47e1f8b805a"
         },
         "hf_model": {
           "path": "hf_model:metrics/publication_audit.json",
           "exists": true,
+          "bytes": 9598,
+          "sha256": "f1d2bff3ff9bb0be059a23eec635974cdd8208a8670277178050c47e1f8b805a"
         }
       },
       "failures": []
         "path": "repo:docs/data/public_surface_qa.json",
         "exists": true,
         "bytes": 7126,
+        "sha256": "a31696958f45455e18b6d85c5b206e19746e3948781c04bde1cf9e3f4c9ba108"
       },
       "mirrors": {
         "hf_space": {
           "path": "hf_space:data/public_surface_qa.json",
           "exists": true,
           "bytes": 7126,
+          "sha256": "a31696958f45455e18b6d85c5b206e19746e3948781c04bde1cf9e3f4c9ba108"
         },
         "hf_artifacts_data": {
           "path": "hf_artifacts:data/public_surface_qa.json",
           "exists": true,
           "bytes": 7126,
+          "sha256": "a31696958f45455e18b6d85c5b206e19746e3948781c04bde1cf9e3f4c9ba108"
         },
         "hf_artifacts": {
           "path": "hf_artifacts:docs/data/public_surface_qa.json",
           "exists": true,
           "bytes": 7126,
+          "sha256": "a31696958f45455e18b6d85c5b206e19746e3948781c04bde1cf9e3f4c9ba108"
         },
         "hf_model_data": {
           "path": "hf_model:data/public_surface_qa.json",
           "exists": true,
           "bytes": 7126,
+          "sha256": "a31696958f45455e18b6d85c5b206e19746e3948781c04bde1cf9e3f4c9ba108"
         },
         "hf_model_docs_data": {
           "path": "hf_model:docs/data/public_surface_qa.json",
           "exists": true,
           "bytes": 7126,
+          "sha256": "a31696958f45455e18b6d85c5b206e19746e3948781c04bde1cf9e3f4c9ba108"
         },
         "hf_model": {
           "path": "hf_model:metrics/public_surface_qa.json",
           "exists": true,
           "bytes": 7126,
+          "sha256": "a31696958f45455e18b6d85c5b206e19746e3948781c04bde1cf9e3f4c9ba108"
         }
       },
       "failures": []
         "path": "repo:docs/data/quality_gates.json",
         "exists": true,
         "bytes": 8100,
+        "sha256": "0ebf0a5e182beac55d7eddf9497cede3fa311d53d0244d39cedf912a01dd958e"
       },
       "mirrors": {
         "hf_space": {
           "path": "hf_space:data/quality_gates.json",
           "exists": true,
           "bytes": 8100,
+          "sha256": "0ebf0a5e182beac55d7eddf9497cede3fa311d53d0244d39cedf912a01dd958e"
         },
         "hf_artifacts_data": {
           "path": "hf_artifacts:data/quality_gates.json",
           "exists": true,
           "bytes": 8100,
+          "sha256": "0ebf0a5e182beac55d7eddf9497cede3fa311d53d0244d39cedf912a01dd958e"
         },
         "hf_artifacts": {
           "path": "hf_artifacts:docs/data/quality_gates.json",
           "exists": true,
           "bytes": 8100,
+          "sha256": "0ebf0a5e182beac55d7eddf9497cede3fa311d53d0244d39cedf912a01dd958e"
         },
         "hf_model_data": {
           "path": "hf_model:data/quality_gates.json",
           "exists": true,
           "bytes": 8100,
+          "sha256": "0ebf0a5e182beac55d7eddf9497cede3fa311d53d0244d39cedf912a01dd958e"
         },
         "hf_model_docs_data": {
           "path": "hf_model:docs/data/quality_gates.json",
           "exists": true,
           "bytes": 8100,
+          "sha256": "0ebf0a5e182beac55d7eddf9497cede3fa311d53d0244d39cedf912a01dd958e"
         },
         "hf_model": {
           "path": "hf_model:metrics/quality_gates.json",
           "exists": true,
           "bytes": 8100,
+          "sha256": "0ebf0a5e182beac55d7eddf9497cede3fa311d53d0244d39cedf912a01dd958e"
         }
       },
       "failures": []
         "path": "repo:docs/data/scope_claims_audit.json",
         "exists": true,
         "bytes": 21630,
+        "sha256": "ad761be4cf4410d2a18f8af08eb742d37661f1ff2eb78ea60d8d74c1fcf45a1a"
       },
       "mirrors": {
         "hf_space": {
           "path": "hf_space:data/scope_claims_audit.json",
           "exists": true,
           "bytes": 21630,
+          "sha256": "ad761be4cf4410d2a18f8af08eb742d37661f1ff2eb78ea60d8d74c1fcf45a1a"
         },
         "hf_artifacts_data": {
           "path": "hf_artifacts:data/scope_claims_audit.json",
           "exists": true,
           "bytes": 21630,
+          "sha256": "ad761be4cf4410d2a18f8af08eb742d37661f1ff2eb78ea60d8d74c1fcf45a1a"
         },
         "hf_artifacts": {
           "path": "hf_artifacts:docs/data/scope_claims_audit.json",
           "exists": true,
           "bytes": 21630,
+          "sha256": "ad761be4cf4410d2a18f8af08eb742d37661f1ff2eb78ea60d8d74c1fcf45a1a"
         },
         "hf_model_data": {
           "path": "hf_model:data/scope_claims_audit.json",
           "exists": true,
           "bytes": 21630,
+          "sha256": "ad761be4cf4410d2a18f8af08eb742d37661f1ff2eb78ea60d8d74c1fcf45a1a"
         },
         "hf_model_docs_data": {
           "path": "hf_model:docs/data/scope_claims_audit.json",
           "exists": true,
           "bytes": 21630,
+          "sha256": "ad761be4cf4410d2a18f8af08eb742d37661f1ff2eb78ea60d8d74c1fcf45a1a"
         },
         "hf_model": {
           "path": "hf_model:metrics/scope_claims_audit.json",
           "exists": true,
           "bytes": 21630,
+          "sha256": "ad761be4cf4410d2a18f8af08eb742d37661f1ff2eb78ea60d8d74c1fcf45a1a"
         }
       },
       "failures": []
         "path": "repo:docs/data/source_alignment_audit.json",
         "exists": true,
         "bytes": 4432,
+        "sha256": "8494b6983100acdfde9b5929e871b27120897af8ec7b5a3031aa142b598a09ae"
       },
       "mirrors": {
         "hf_space": {
           "path": "hf_space:data/source_alignment_audit.json",
           "exists": true,
           "bytes": 4432,
+          "sha256": "8494b6983100acdfde9b5929e871b27120897af8ec7b5a3031aa142b598a09ae"
         },
         "hf_artifacts_data": {
           "path": "hf_artifacts:data/source_alignment_audit.json",
           "exists": true,
           "bytes": 4432,
+          "sha256": "8494b6983100acdfde9b5929e871b27120897af8ec7b5a3031aa142b598a09ae"
         },
         "hf_artifacts": {
           "path": "hf_artifacts:docs/data/source_alignment_audit.json",
           "exists": true,
           "bytes": 4432,
+          "sha256": "8494b6983100acdfde9b5929e871b27120897af8ec7b5a3031aa142b598a09ae"
         },
         "hf_model_data": {
           "path": "hf_model:data/source_alignment_audit.json",
           "exists": true,
           "bytes": 4432,
+          "sha256": "8494b6983100acdfde9b5929e871b27120897af8ec7b5a3031aa142b598a09ae"
         },
         "hf_model_docs_data": {
           "path": "hf_model:docs/data/source_alignment_audit.json",
           "exists": true,
           "bytes": 4432,
+          "sha256": "8494b6983100acdfde9b5929e871b27120897af8ec7b5a3031aa142b598a09ae"
         },
         "hf_model": {
           "path": "hf_model:metrics/source_alignment_audit.json",
           "exists": true,
           "bytes": 4432,
+          "sha256": "8494b6983100acdfde9b5929e871b27120897af8ec7b5a3031aa142b598a09ae"
         }
       },
       "failures": []
         "path": "repo:docs/data/single_episode_task_model_radar.json",
         "exists": true,
         "bytes": 50973,
+        "sha256": "6db28943d1206aef75fbce8ea87ea52a35c0144c6186214f37da9311ca8c9a0c"
       },
       "mirrors": {
         "hf_space": {
           "path": "hf_space:data/single_episode_task_model_radar.json",
           "exists": true,
           "bytes": 50973,
+          "sha256": "6db28943d1206aef75fbce8ea87ea52a35c0144c6186214f37da9311ca8c9a0c"
         },
         "hf_artifacts_data": {
           "path": "hf_artifacts:data/single_episode_task_model_radar.json",
           "exists": true,
           "bytes": 50973,
+          "sha256": "6db28943d1206aef75fbce8ea87ea52a35c0144c6186214f37da9311ca8c9a0c"
         },
         "hf_artifacts": {
           "path": "hf_artifacts:docs/data/single_episode_task_model_radar.json",
           "exists": true,
           "bytes": 50973,
+          "sha256": "6db28943d1206aef75fbce8ea87ea52a35c0144c6186214f37da9311ca8c9a0c"
         },
         "hf_model_data": {
           "path": "hf_model:data/single_episode_task_model_radar.json",
           "exists": true,
           "bytes": 50973,
+          "sha256": "6db28943d1206aef75fbce8ea87ea52a35c0144c6186214f37da9311ca8c9a0c"
         },
         "hf_model_docs_data": {
           "path": "hf_model:docs/data/single_episode_task_model_radar.json",
           "exists": true,
           "bytes": 50973,
+          "sha256": "6db28943d1206aef75fbce8ea87ea52a35c0144c6186214f37da9311ca8c9a0c"
         },
         "hf_model": {
           "path": "hf_model:metrics/single_episode_task_model_radar.json",
           "exists": true,
           "bytes": 50973,
+          "sha256": "6db28943d1206aef75fbce8ea87ea52a35c0144c6186214f37da9311ca8c9a0c"
         }
       },
       "failures": []
       "local": {
         "path": "repo:docs/data/episode128_task_model_radar.json",
         "exists": true,
+        "bytes": 187271,
+        "sha256": "acd8623ad19bf0d0ee1ffb434ecefa087339b59e97d30809eca9b739f83f1a89"
       },
       "mirrors": {
         "hf_space": {
           "path": "hf_space:data/episode128_task_model_radar.json",
           "exists": true,
+          "bytes": 187271,
+          "sha256": "acd8623ad19bf0d0ee1ffb434ecefa087339b59e97d30809eca9b739f83f1a89"
         },
         "hf_artifacts_data": {
           "path": "hf_artifacts:data/episode128_task_model_radar.json",
           "exists": true,
+          "bytes": 187271,
+          "sha256": "acd8623ad19bf0d0ee1ffb434ecefa087339b59e97d30809eca9b739f83f1a89"
         },
         "hf_artifacts": {
           "path": "hf_artifacts:docs/data/episode128_task_model_radar.json",
           "exists": true,
+          "bytes": 187271,
+          "sha256": "acd8623ad19bf0d0ee1ffb434ecefa087339b59e97d30809eca9b739f83f1a89"
         },
         "hf_model_data": {
           "path": "hf_model:data/episode128_task_model_radar.json",
           "exists": true,
+          "bytes": 187271,
+          "sha256": "acd8623ad19bf0d0ee1ffb434ecefa087339b59e97d30809eca9b739f83f1a89"
         },
         "hf_model_docs_data": {
           "path": "hf_model:docs/data/episode128_task_model_radar.json",
           "exists": true,
+          "bytes": 187271,
+          "sha256": "acd8623ad19bf0d0ee1ffb434ecefa087339b59e97d30809eca9b739f83f1a89"
         },
         "hf_model": {
           "path": "hf_model:metrics/episode128_task_model_radar.json",
           "exists": true,
+          "bytes": 187271,
+          "sha256": "acd8623ad19bf0d0ee1ffb434ecefa087339b59e97d30809eca9b739f83f1a89"
         }
       },
       "failures": []
         "path": "repo:docs/data/task_surface_integrity.json",
         "exists": true,
         "bytes": 45779,
+        "sha256": "0179ae9e9f4dffe7fea263b0e5a7a9b8c930bfcdf5794ff42c46f65efeee3182"
       },
       "mirrors": {
         "hf_space": {
           "path": "hf_space:data/task_surface_integrity.json",
           "exists": true,
           "bytes": 45779,
+          "sha256": "0179ae9e9f4dffe7fea263b0e5a7a9b8c930bfcdf5794ff42c46f65efeee3182"
         },
         "hf_artifacts_data": {
           "path": "hf_artifacts:data/task_surface_integrity.json",
           "exists": true,
           "bytes": 45779,
+          "sha256": "0179ae9e9f4dffe7fea263b0e5a7a9b8c930bfcdf5794ff42c46f65efeee3182"
         },
         "hf_artifacts": {
           "path": "hf_artifacts:docs/data/task_surface_integrity.json",
           "exists": true,
           "bytes": 45779,
+          "sha256": "0179ae9e9f4dffe7fea263b0e5a7a9b8c930bfcdf5794ff42c46f65efeee3182"
         },
         "hf_model_data": {
           "path": "hf_model:data/task_surface_integrity.json",
           "exists": true,
           "bytes": 45779,
+          "sha256": "0179ae9e9f4dffe7fea263b0e5a7a9b8c930bfcdf5794ff42c46f65efeee3182"
         },
         "hf_model_docs_data": {
           "path": "hf_model:docs/data/task_surface_integrity.json",
           "exists": true,
           "bytes": 45779,
+          "sha256": "0179ae9e9f4dffe7fea263b0e5a7a9b8c930bfcdf5794ff42c46f65efeee3182"
         },
         "hf_model": {
           "path": "hf_model:metrics/task_surface_integrity.json",
           "exists": true,
           "bytes": 45779,
+          "sha256": "0179ae9e9f4dffe7fea263b0e5a7a9b8c930bfcdf5794ff42c46f65efeee3182"
         }
       },
       "failures": []
       "local": {
         "path": "repo:docs/data/task_method_20_result_matrix.json",
         "exists": true,
+        "bytes": 129687,
+        "sha256": "e5d3fa22013fedf350907746f775cc4a1ca3bb3f816b40ca9467d51cf16925f8"
       },
       "mirrors": {
         "hf_space": {
           "path": "hf_space:data/task_method_20_result_matrix.json",
           "exists": true,
+          "bytes": 129687,
+          "sha256": "e5d3fa22013fedf350907746f775cc4a1ca3bb3f816b40ca9467d51cf16925f8"
         },
         "hf_artifacts_data": {
           "path": "hf_artifacts:data/task_method_20_result_matrix.json",
           "exists": true,
+          "bytes": 129687,
+          "sha256": "e5d3fa22013fedf350907746f775cc4a1ca3bb3f816b40ca9467d51cf16925f8"
         },
         "hf_artifacts": {
           "path": "hf_artifacts:docs/data/task_method_20_result_matrix.json",
           "exists": true,
+          "bytes": 129687,
+          "sha256": "e5d3fa22013fedf350907746f775cc4a1ca3bb3f816b40ca9467d51cf16925f8"
         },
         "hf_model_data": {
           "path": "hf_model:data/task_method_20_result_matrix.json",
           "exists": true,
+          "bytes": 129687,
+          "sha256": "e5d3fa22013fedf350907746f775cc4a1ca3bb3f816b40ca9467d51cf16925f8"
         },
         "hf_model_docs_data": {
           "path": "hf_model:docs/data/task_method_20_result_matrix.json",
           "exists": true,
+          "bytes": 129687,
+          "sha256": "e5d3fa22013fedf350907746f775cc4a1ca3bb3f816b40ca9467d51cf16925f8"
         },
         "hf_model": {
           "path": "hf_model:metrics/task_method_20_result_matrix.json",
           "exists": true,
+          "bytes": 129687,
+          "sha256": "e5d3fa22013fedf350907746f775cc4a1ca3bb3f816b40ca9467d51cf16925f8"
         }
       },
       "failures": []
       "local": {
         "path": "repo:docs/data/task_method_20_gap_audit.json",
         "exists": true,
+        "bytes": 52153,
+        "sha256": "e47ac5d2ac8216f2b46b5fb868275c779226dce8089a8c025dd26571cb5758d3"
       },
       "mirrors": {
         "hf_space": {
           "path": "hf_space:data/task_method_20_gap_audit.json",
           "exists": true,
+          "bytes": 52153,
+          "sha256": "e47ac5d2ac8216f2b46b5fb868275c779226dce8089a8c025dd26571cb5758d3"
         },
         "hf_artifacts_data": {
           "path": "hf_artifacts:data/task_method_20_gap_audit.json",
           "exists": true,
+          "bytes": 52153,
+          "sha256": "e47ac5d2ac8216f2b46b5fb868275c779226dce8089a8c025dd26571cb5758d3"
         },
         "hf_artifacts": {
           "path": "hf_artifacts:docs/data/task_method_20_gap_audit.json",
           "exists": true,
+          "bytes": 52153,
+          "sha256": "e47ac5d2ac8216f2b46b5fb868275c779226dce8089a8c025dd26571cb5758d3"
         },
         "hf_model_data": {
           "path": "hf_model:data/task_method_20_gap_audit.json",
           "exists": true,
+          "bytes": 52153,
+          "sha256": "e47ac5d2ac8216f2b46b5fb868275c779226dce8089a8c025dd26571cb5758d3"
         },
         "hf_model_docs_data": {
           "path": "hf_model:docs/data/task_method_20_gap_audit.json",
           "exists": true,
+          "bytes": 52153,
+          "sha256": "e47ac5d2ac8216f2b46b5fb868275c779226dce8089a8c025dd26571cb5758d3"
         },
         "hf_model": {
           "path": "hf_model:metrics/task_method_20_gap_audit.json",
           "exists": true,
+          "bytes": 52153,
+          "sha256": "e47ac5d2ac8216f2b46b5fb868275c779226dce8089a8c025dd26571cb5758d3"
         }
       },
       "failures": []
       "local": {
         "path": "repo:docs/data/unified_task_model_radar.json",
         "exists": true,
+        "bytes": 231123,
+        "sha256": "c004d35f0a3e0073c4116dd79a2bcdaac872605d715a7eccdaa15787df800f07"
       },
       "mirrors": {
         "hf_space": {
           "path": "hf_space:data/unified_task_model_radar.json",
           "exists": true,
+          "bytes": 231123,
+          "sha256": "c004d35f0a3e0073c4116dd79a2bcdaac872605d715a7eccdaa15787df800f07"
         },
         "hf_artifacts_data": {
           "path": "hf_artifacts:data/unified_task_model_radar.json",
           "exists": true,
+          "bytes": 231123,
+          "sha256": "c004d35f0a3e0073c4116dd79a2bcdaac872605d715a7eccdaa15787df800f07"
         },
         "hf_artifacts": {
           "path": "hf_artifacts:docs/data/unified_task_model_radar.json",
           "exists": true,
+          "bytes": 231123,
+          "sha256": "c004d35f0a3e0073c4116dd79a2bcdaac872605d715a7eccdaa15787df800f07"
         },
         "hf_model_data": {
           "path": "hf_model:data/unified_task_model_radar.json",
           "exists": true,
+          "bytes": 231123,
+          "sha256": "c004d35f0a3e0073c4116dd79a2bcdaac872605d715a7eccdaa15787df800f07"
         },
         "hf_model_docs_data": {
           "path": "hf_model:docs/data/unified_task_model_radar.json",
           "exists": true,
+          "bytes": 231123,
+          "sha256": "c004d35f0a3e0073c4116dd79a2bcdaac872605d715a7eccdaa15787df800f07"
         },
         "hf_model": {
           "path": "hf_model:metrics/unified_task_model_radar.json",
           "exists": true,
+          "bytes": 231123,
+          "sha256": "c004d35f0a3e0073c4116dd79a2bcdaac872605d715a7eccdaa15787df800f07"
         }
       },
       "failures": []
         "path": "repo:docs/data/website_integrity.json",
         "exists": true,
         "bytes": 20021,
+        "sha256": "ae1df93522b60a498309b3f5e9cc81b4dd1af7e761fab8a30261cb914c53de6d"
       },
       "mirrors": {
         "hf_space": {
           "path": "hf_space:data/website_integrity.json",
           "exists": true,
           "bytes": 20021,
+          "sha256": "ae1df93522b60a498309b3f5e9cc81b4dd1af7e761fab8a30261cb914c53de6d"
         },
         "hf_artifacts_data": {
           "path": "hf_artifacts:data/website_integrity.json",
           "exists": true,
           "bytes": 20021,
+          "sha256": "ae1df93522b60a498309b3f5e9cc81b4dd1af7e761fab8a30261cb914c53de6d"
         },
         "hf_artifacts": {
           "path": "hf_artifacts:docs/data/website_integrity.json",
           "exists": true,
           "bytes": 20021,
+          "sha256": "ae1df93522b60a498309b3f5e9cc81b4dd1af7e761fab8a30261cb914c53de6d"
         },
         "hf_model_data": {
           "path": "hf_model:data/website_integrity.json",
           "exists": true,
           "bytes": 20021,
+          "sha256": "ae1df93522b60a498309b3f5e9cc81b4dd1af7e761fab8a30261cb914c53de6d"
         },
         "hf_model_docs_data": {
           "path": "hf_model:docs/data/website_integrity.json",
           "exists": true,
           "bytes": 20021,
+          "sha256": "ae1df93522b60a498309b3f5e9cc81b4dd1af7e761fab8a30261cb914c53de6d"
         },
         "hf_model": {
           "path": "hf_model:metrics/website_integrity.json",
           "exists": true,
           "bytes": 20021,
+          "sha256": "ae1df93522b60a498309b3f5e9cc81b4dd1af7e761fab8a30261cb914c53de6d"
         }
       },
       "failures": []
       "local": {
         "path": "repo:docs/assets/charts/episode128_task_model_radar.svg",
         "exists": true,
+        "bytes": 44602,
+        "sha256": "9a2fd542502cb26f093097d9ace238f8cf3b619e0abdec5bf2870c5271fb9ed5"
       },
       "mirrors": {
         "hf_space": {
           "path": "hf_space:assets/charts/episode128_task_model_radar.svg",
           "exists": true,
+          "bytes": 44602,
+          "sha256": "9a2fd542502cb26f093097d9ace238f8cf3b619e0abdec5bf2870c5271fb9ed5"
         },
         "hf_artifacts_docs": {
           "path": "hf_artifacts:docs/assets/charts/episode128_task_model_radar.svg",
           "exists": true,
+          "bytes": 44602,
+          "sha256": "9a2fd542502cb26f093097d9ace238f8cf3b619e0abdec5bf2870c5271fb9ed5"
         },
         "hf_artifacts_card": {
           "path": "hf_artifacts:assets/charts/episode128_task_model_radar.svg",
           "exists": true,
+          "bytes": 44602,
+          "sha256": "9a2fd542502cb26f093097d9ace238f8cf3b619e0abdec5bf2870c5271fb9ed5"
         },
         "hf_model": {
           "path": "hf_model:assets/charts/episode128_task_model_radar.svg",
           "exists": true,
+          "bytes": 44602,
+          "sha256": "9a2fd542502cb26f093097d9ace238f8cf3b619e0abdec5bf2870c5271fb9ed5"
         }
       },
       "failures": []
       "local": {
         "path": "repo:docs/assets/charts/unified_task_model_radar.svg",
         "exists": true,
+        "bytes": 50618,
+        "sha256": "29ede875ef96c76a8aa7ec6e9883457be611fac8ef967b825041b33fe1d86863"
       },
       "mirrors": {
         "hf_space": {
           "path": "hf_space:assets/charts/unified_task_model_radar.svg",
           "exists": true,
+          "bytes": 50618,
+          "sha256": "29ede875ef96c76a8aa7ec6e9883457be611fac8ef967b825041b33fe1d86863"
         },
         "hf_artifacts_docs": {
           "path": "hf_artifacts:docs/assets/charts/unified_task_model_radar.svg",
           "exists": true,
+          "bytes": 50618,
+          "sha256": "29ede875ef96c76a8aa7ec6e9883457be611fac8ef967b825041b33fe1d86863"
         },
         "hf_artifacts_card": {
           "path": "hf_artifacts:assets/charts/unified_task_model_radar.svg",
           "exists": true,
+          "bytes": 50618,
+          "sha256": "29ede875ef96c76a8aa7ec6e9883457be611fac8ef967b825041b33fe1d86863"
         },
         "hf_model": {
           "path": "hf_model:assets/charts/unified_task_model_radar.svg",
           "exists": true,
+          "bytes": 50618,
+          "sha256": "29ede875ef96c76a8aa7ec6e9883457be611fac8ef967b825041b33fe1d86863"
         }
       },
       "failures": []
       },
       "failures": []
     },
+    {
+      "name": "scripts/omni/collect_qwen3_retrieval_task_probe_results.sh",
+      "status": "pass",
+      "local": {
+        "path": "repo:scripts/omni/collect_qwen3_retrieval_task_probe_results.sh",
+        "exists": true,
+        "bytes": 3435,
+        "sha256": "257ba6267aab0ee2e06a03a9ad61175773948d039c6c5ce168471a800c1342fc"
+      },
+      "mirrors": {
+        "hf_artifacts": {
+          "path": "hf_artifacts:scripts/omni/collect_qwen3_retrieval_task_probe_results.sh",
+          "exists": true,
+          "bytes": 3435,
+          "sha256": "257ba6267aab0ee2e06a03a9ad61175773948d039c6c5ce168471a800c1342fc"
+        },
+        "hf_model": {
+          "path": "hf_model:scripts/omni/collect_qwen3_retrieval_task_probe_results.sh",
+          "exists": true,
+          "bytes": 3435,
+          "sha256": "257ba6267aab0ee2e06a03a9ad61175773948d039c6c5ce168471a800c1342fc"
+        }
+      },
+      "failures": []
+    },
     {
       "name": "scripts/omni/collect_qwen3_v4_release_artifacts.py",
       "status": "pass",
       "local": {
         "path": "repo:scripts/validate_mirror_parity.py",
         "exists": true,
+        "bytes": 28485,
+        "sha256": "6c7fbcf2e7a22a71a547da7bb004cd662b6ba742cb8d049da1881928e9c6f509"
       },
       "mirrors": {
         "hf_artifacts": {
           "path": "hf_artifacts:scripts/validate_mirror_parity.py",
           "exists": true,
+          "bytes": 28485,
+          "sha256": "6c7fbcf2e7a22a71a547da7bb004cd662b6ba742cb8d049da1881928e9c6f509"
         },
         "hf_model": {
           "path": "hf_model:scripts/validate_mirror_parity.py",
           "exists": true,
+          "bytes": 28485,
+          "sha256": "6c7fbcf2e7a22a71a547da7bb004cd662b6ba742cb8d049da1881928e9c6f509"
         }
       },
       "failures": []
       "local": {
         "path": "repo:scripts/validate_publication_package.py",
         "exists": true,
+        "bytes": 19982,
+        "sha256": "7770d277c8de2c8c93b92a135ce02c7c4dff64d15199f949688734c942f8fc45"
       },
       "mirrors": {
         "hf_artifacts": {
           "path": "hf_artifacts:scripts/validate_publication_package.py",
           "exists": true,
+          "bytes": 19982,
+          "sha256": "7770d277c8de2c8c93b92a135ce02c7c4dff64d15199f949688734c942f8fc45"
         },
         "hf_model": {
           "path": "hf_model:scripts/validate_publication_package.py",
           "exists": true,
+          "bytes": 19982,
+          "sha256": "7770d277c8de2c8c93b92a135ce02c7c4dff64d15199f949688734c942f8fc45"
         }
       },
       "failures": []
       "local": {
         "path": "repo:TASK_METHOD_20_GAP_AUDIT.md",
         "exists": true,
+        "bytes": 14812,
+        "sha256": "d2f0228497fa834c7f097e1fe74e2210b85d0a01f7841356e67dc79929a74413"
       },
       "mirrors": {
         "hf_space": {
           "path": "hf_space:TASK_METHOD_20_GAP_AUDIT.md",
           "exists": true,
+          "bytes": 14812,
+          "sha256": "d2f0228497fa834c7f097e1fe74e2210b85d0a01f7841356e67dc79929a74413"
         },
         "hf_artifacts": {
           "path": "hf_artifacts:TASK_METHOD_20_GAP_AUDIT.md",
           "exists": true,
+          "bytes": 14812,
+          "sha256": "d2f0228497fa834c7f097e1fe74e2210b85d0a01f7841356e67dc79929a74413"
         },
         "hf_model": {
           "path": "hf_model:TASK_METHOD_20_GAP_AUDIT.md",
           "exists": true,
+          "bytes": 14812,
+          "sha256": "d2f0228497fa834c7f097e1fe74e2210b85d0a01f7841356e67dc79929a74413"
         }
       },
       "failures": []
       "local": {
         "path": "repo:TASK_METHOD_20_RESULT_MATRIX.md",
         "exists": true,
+        "bytes": 4144,
+        "sha256": "dac2828ba0286bc35290a61b6d02dbd75f0b3acb8d47a73cfa7f072d7fa209c1"
       },
       "mirrors": {
         "hf_space": {
           "path": "hf_space:TASK_METHOD_20_RESULT_MATRIX.md",
           "exists": true,
+          "bytes": 4144,
+          "sha256": "dac2828ba0286bc35290a61b6d02dbd75f0b3acb8d47a73cfa7f072d7fa209c1"
         },
         "hf_artifacts": {
           "path": "hf_artifacts:TASK_METHOD_20_RESULT_MATRIX.md",
           "exists": true,
+          "bytes": 4144,
+          "sha256": "dac2828ba0286bc35290a61b6d02dbd75f0b3acb8d47a73cfa7f072d7fa209c1"
         },
         "hf_model": {
           "path": "hf_model:TASK_METHOD_20_RESULT_MATRIX.md",
           "exists": true,
+          "bytes": 4144,
+          "sha256": "dac2828ba0286bc35290a61b6d02dbd75f0b3acb8d47a73cfa7f072d7fa209c1"
         }
       },
       "failures": []

docs/data/publication_audit.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "status": "pass",
-  "generated_at_utc": "2026-06-18T09:30:36+00:00",
   "checks": [
     {
       "name": "required_publication_assets_present",
@@ -164,6 +164,7 @@
     "scripts/publish_hf_bundles.py": true,
     "scripts/omni/build_128_episode_feature_index.py": true,
     "scripts/omni/build_task_suite_enhancement_128.py": true,
     "scripts/omni/train_qwen3_omni_lora.py": true,
     "results/omni_finetune/task_suite_enhancement_128_v1_20260608/enhancement_plan.json": true,
     "results/omni_finetune/task_suite_enhancement_128_v1_20260608/ENHANCEMENT_REPORT.md": true
@@ -214,8 +215,8 @@
     "github_repo": {
       "root": "repo",
       "exists": true,
-      "file_count": 1263,
-      "text_file_count": 1060,
       "largest_file": {
         "path": "results/episode_task_suite/modality_reconstruction/predictions.npz",
         "bytes": 55702978

 {
   "status": "pass",
+  "generated_at_utc": "2026-06-18T10:04:59+00:00",
   "checks": [
     {
       "name": "required_publication_assets_present",
     "scripts/publish_hf_bundles.py": true,
     "scripts/omni/build_128_episode_feature_index.py": true,
     "scripts/omni/build_task_suite_enhancement_128.py": true,
+    "scripts/omni/collect_qwen3_retrieval_task_probe_results.sh": true,
     "scripts/omni/train_qwen3_omni_lora.py": true,
     "results/omni_finetune/task_suite_enhancement_128_v1_20260608/enhancement_plan.json": true,
     "results/omni_finetune/task_suite_enhancement_128_v1_20260608/ENHANCEMENT_REPORT.md": true
     "github_repo": {
       "root": "repo",
       "exists": true,
+      "file_count": 1264,
+      "text_file_count": 1061,
       "largest_file": {
         "path": "results/episode_task_suite/modality_reconstruction/predictions.npz",
         "bytes": 55702978

docs/data/quality_gates.json CHANGED Viewed

@@ -1,7 +1,7 @@
 {
   "title": "Ropedia Xperience-10M Release Checks",
   "status": "pass",
-  "generated_at_utc": "2026-06-18T09:31:04+00:00",
   "rule": "A release is current when the automated reports pass and the live GitHub/Hugging Face mirrors are verified after publishing.",
   "automated_gates": [
     {

 {
   "title": "Ropedia Xperience-10M Release Checks",
   "status": "pass",
+  "generated_at_utc": "2026-06-18T10:05:25+00:00",
   "rule": "A release is current when the automated reports pass and the live GitHub/Hugging Face mirrors are verified after publishing.",
   "automated_gates": [
     {

docs/data/scope_claims_audit.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "status": "pass",
-  "generated_at_utc": "2026-06-18T09:28:46+00:00",
   "summary": {
     "qwen3_omni_verified_diagnostic_pilot": true,
     "dataset_manifest_num_episodes": 119,

 {
   "status": "pass",
+  "generated_at_utc": "2026-06-18T10:04:37+00:00",
   "summary": {
     "qwen3_omni_verified_diagnostic_pilot": true,
     "dataset_manifest_num_episodes": 119,

docs/data/single_episode_task_model_radar.json CHANGED Viewed

@@ -1,7 +1,7 @@
 {
   "title": "Single-Episode 20-Task Radar",
   "status": "pass",
-  "generated_at_utc": "2026-06-18T09:06:25+00:00",
   "description": "Minimal and Neural MLP baselines on the one public sample episode, both scored on all 20 task contracts.",
   "task_count": 20,
   "method_count": 2,

 {
   "title": "Single-Episode 20-Task Radar",
   "status": "pass",
+  "generated_at_utc": "2026-06-18T10:04:17+00:00",
   "description": "Minimal and Neural MLP baselines on the one public sample episode, both scored on all 20 task contracts.",
   "task_count": 20,
   "method_count": 2,

docs/data/source_alignment_audit.json CHANGED Viewed

@@ -1,7 +1,7 @@
 {
   "title": "Ropedia Xperience-10M Source Alignment Note",
   "status": "pass",
-  "generated_at_utc": "2026-06-18T09:28:24+00:00",
   "alignment_json": "docs/data/xperience10m_dataset_card_alignment.json",
   "alignment_summary": {
     "full_dataset_repo": "ropedia-ai/xperience-10m",

 {
   "title": "Ropedia Xperience-10M Source Alignment Note",
   "status": "pass",
+  "generated_at_utc": "2026-06-18T10:04:36+00:00",
   "alignment_json": "docs/data/xperience10m_dataset_card_alignment.json",
   "alignment_summary": {
     "full_dataset_repo": "ropedia-ai/xperience-10m",

docs/data/task_method_20_gap_audit.json CHANGED Viewed

@@ -1,10 +1,10 @@
 {
-  "generated_at_utc": "2026-06-18T09:06:40+00:00",
   "immediate_actions": [
     {
       "artifact": "docs/data/task_method_20_gap_audit.json",
       "id": "gap_audit",
-      "purpose": "Keep the 60 scoreless cells visible and reproducible."
     },
     {
       "artifact": "scripts/omni/score_model_output_probes.py",
@@ -101,11 +101,11 @@
       "proxy_scored_task_count": 0,
       "result_record_count": 20,
       "scope": "128 selected episodes, held-out test",
-      "scored_task_count": 14,
-      "scoreless_task_count": 6,
       "status_counts": {
-        "not_evaluated_in_verified_package": 6,
-        "scored": 14
       }
     },
     "raw128_neural_mlp": {
@@ -140,10 +140,10 @@
     "cosmos3_super_reasoner": 13,
     "metadata128_neural_mlp": 14,
     "metadata128_simple": 12,
-    "qwen3_omni_v6_lora": 6
   },
   "missing_by_status": {
-    "not_evaluated_in_verified_package": 34,
     "not_supported_by_metadata_only_package": 22,
     "unsupported_without_required_target": 4
   },
@@ -169,8 +169,7 @@
     "09 Cross-Modal Retrieval": [
       "cosmos3_super_reasoner",
       "metadata128_neural_mlp",
-      "metadata128_simple",
-      "qwen3_omni_v6_lora"
     ],
     "10 Cross-Modal Reconstruction": [
       "cosmos3_nano_future_window",
@@ -398,19 +397,6 @@
       "task_label": "Cross-Modal Retrieval",
       "task_number": 9
     },
-    {
-      "method": "Qwen3-Omni v6 LoRA",
-      "metric_key": "mrr",
-      "reason": "the verified public model package did not ask this branch to emit that task target; a new task-specific evaluation package is required for a numeric score",
-      "recommended_next_step": "Generate verified model outputs for this task contract and score them against the held-out labels.",
-      "scope": "multi_episode_128_partial_model_overlay",
-      "series_id": "qwen3_omni_v6_lora",
-      "status": "not_evaluated_in_verified_package",
-      "status_label": "not evaluated",
-      "task_id": "cross_modal_retrieval",
-      "task_label": "Cross-Modal Retrieval",
-      "task_number": 9
-    },
     {
       "method": "Cosmos3-Super Reasoner",
       "metric_key": "mrr",
@@ -1069,8 +1055,8 @@
     "method_count": 9,
     "method_task_record_count": 180,
     "proxy_scored_method_task_count": 4,
-    "scored_method_task_count": 120,
-    "scoreless_method_task_count": 60,
     "task_count": 20
   },
   "source_matrix": "docs/data/task_method_20_result_matrix.json",

 {
+  "generated_at_utc": "2026-06-18T10:04:17+00:00",
   "immediate_actions": [
     {
       "artifact": "docs/data/task_method_20_gap_audit.json",
       "id": "gap_audit",
+      "purpose": "Keep the 59 scoreless cells visible and reproducible."
     },
     {
       "artifact": "scripts/omni/score_model_output_probes.py",
       "proxy_scored_task_count": 0,
       "result_record_count": 20,
       "scope": "128 selected episodes, held-out test",
+      "scored_task_count": 15,
+      "scoreless_task_count": 5,
       "status_counts": {
+        "not_evaluated_in_verified_package": 5,
+        "scored": 15
       }
     },
     "raw128_neural_mlp": {
     "cosmos3_super_reasoner": 13,
     "metadata128_neural_mlp": 14,
     "metadata128_simple": 12,
+    "qwen3_omni_v6_lora": 5
   },
   "missing_by_status": {
+    "not_evaluated_in_verified_package": 33,
     "not_supported_by_metadata_only_package": 22,
     "unsupported_without_required_target": 4
   },
     "09 Cross-Modal Retrieval": [
       "cosmos3_super_reasoner",
       "metadata128_neural_mlp",
+      "metadata128_simple"
     ],
     "10 Cross-Modal Reconstruction": [
       "cosmos3_nano_future_window",
       "task_label": "Cross-Modal Retrieval",
       "task_number": 9
     },
     {
       "method": "Cosmos3-Super Reasoner",
       "metric_key": "mrr",
     "method_count": 9,
     "method_task_record_count": 180,
     "proxy_scored_method_task_count": 4,
+    "scored_method_task_count": 121,
+    "scoreless_method_task_count": 59,
     "task_count": 20
   },
   "source_matrix": "docs/data/task_method_20_result_matrix.json",

docs/data/task_method_20_result_matrix.json CHANGED Viewed

@@ -1,11 +1,11 @@
 {
   "title": "Task Method 20-Result Matrix",
   "status": "pass",
-  "generated_at_utc": "2026-06-18T09:06:25+00:00",
   "task_count": 20,
   "method_count": 9,
   "method_task_record_count": 180,
-  "scored_method_task_count": 120,
   "series": [
     {
       "id": "minimal",
@@ -161,17 +161,17 @@
       "method_detail": "Verified held-out Qwen3-Omni v6 LoRA metrics, plus task 16 and any completed private-GPU future-task probes scored from task-specific JSON.",
       "plotted_as": "colored point overlay",
       "result_record_count": 20,
-      "scored_task_count": 14,
-      "covered_task_count": 14,
       "proxy_scored_task_count": 0,
-      "scoreless_task_count": 6,
       "unsupported_task_count": 0,
-      "not_evaluated_task_count": 6,
       "status_counts": {
-        "not_evaluated_in_verified_package": 6,
-        "scored": 14
       },
-      "coverage_fraction": 0.7,
       "result_record_fraction": 1.0
     },
     {
@@ -1634,17 +1634,17 @@
       "task_label": "Cross-Modal Retrieval",
       "series_id": "qwen3_omni_v6_lora",
       "method": "Qwen3-Omni v6 LoRA",
-      "status": "not_evaluated_in_verified_package",
-      "status_label": "not evaluated",
-      "scored": false,
       "proxy_scored": false,
-      "raw": null,
-      "raw_text": "n/a",
-      "normalized_score": null,
-      "metric_key": "mrr",
-      "source": null,
       "scope": "multi_episode_128_partial_model_overlay",
-      "reason": "the verified public model package did not ask this branch to emit that task target; a new task-specific evaluation package is required for a numeric score"
     },
     {
       "task_number": 9,

 {
   "title": "Task Method 20-Result Matrix",
   "status": "pass",
+  "generated_at_utc": "2026-06-18T10:04:17+00:00",
   "task_count": 20,
   "method_count": 9,
   "method_task_record_count": 180,
+  "scored_method_task_count": 121,
   "series": [
     {
       "id": "minimal",
       "method_detail": "Verified held-out Qwen3-Omni v6 LoRA metrics, plus task 16 and any completed private-GPU future-task probes scored from task-specific JSON.",
       "plotted_as": "colored point overlay",
       "result_record_count": 20,
+      "scored_task_count": 15,
+      "covered_task_count": 15,
       "proxy_scored_task_count": 0,
+      "scoreless_task_count": 5,
       "unsupported_task_count": 0,
+      "not_evaluated_task_count": 5,
       "status_counts": {
+        "not_evaluated_in_verified_package": 5,
+        "scored": 15
       },
+      "coverage_fraction": 0.75,
       "result_record_fraction": 1.0
     },
     {
       "task_label": "Cross-Modal Retrieval",
       "series_id": "qwen3_omni_v6_lora",
       "method": "Qwen3-Omni v6 LoRA",
+      "status": "scored",
+      "status_label": "scored",
+      "scored": true,
       "proxy_scored": false,
+      "raw": 0.5080191798941732,
+      "raw_text": "0.5080",
+      "normalized_score": 0.5080191798941732,
+      "metric_key": "cross_modal_retrieval_mrr",
+      "source": "results/omni_finetune/xperience10m_qwen3_omni_v6_cross_modal_retrieval_probe_a100_20260618T000000Z/cross_modal_retrieval/metrics.json",
       "scope": "multi_episode_128_partial_model_overlay",
+      "reason": null
     },
     {
       "task_number": 9,

docs/data/unified_task_model_radar.json CHANGED Viewed

@@ -1,11 +1,11 @@
 {
   "title": "Unified 20-Task Model Radar",
   "status": "pass",
-  "generated_at_utc": "2026-06-18T09:06:25+00:00",
   "task_count": 20,
   "method_count": 9,
   "method_task_record_count": 180,
-  "scored_method_task_count": 120,
   "normalization_policy": {
     "higher_is_better": "bounded metrics are plotted directly on 0-1 axes after clipping to [0, 1]",
     "lower_is_better": "lower-error metrics are converted to best_observed_value / raw_value within the same task",
@@ -170,17 +170,17 @@
       "method_detail": "Verified held-out Qwen3-Omni v6 LoRA metrics, plus task 16 and any completed private-GPU future-task probes scored from task-specific JSON.",
       "plotted_as": "colored point overlay",
       "result_record_count": 20,
-      "scored_task_count": 14,
-      "covered_task_count": 14,
       "proxy_scored_task_count": 0,
-      "scoreless_task_count": 6,
       "unsupported_task_count": 0,
-      "not_evaluated_task_count": 6,
       "status_counts": {
-        "not_evaluated_in_verified_package": 6,
-        "scored": 14
       },
-      "coverage_fraction": 0.7,
       "result_record_fraction": 1.0
     },
     {
@@ -1164,6 +1164,17 @@
           "raw_text": "0.0221",
           "status_label": "scored"
         },
         "metadata128_simple": {
           "raw": null,
           "metric_key": "mrr",
@@ -1208,17 +1219,6 @@
           "raw_text": "n/a",
           "status_label": "not supported"
         },
-        "qwen3_omni_v6_lora": {
-          "raw": null,
-          "metric_key": "mrr",
-          "source": null,
-          "scope": "multi_episode_128_partial_model_overlay",
-          "status": "not_evaluated_in_verified_package",
-          "reason": "the verified public model package did not ask this branch to emit that task target; a new task-specific evaluation package is required for a numeric score",
-          "normalized_score": null,
-          "raw_text": "n/a",
-          "status_label": "not evaluated"
-        },
         "cosmos3_super_reasoner": {
           "raw": null,
           "metric_key": "mrr",
@@ -2492,7 +2492,7 @@
       "title": "Qwen3-Omni v6 LoRA",
       "status": "verified",
       "task_aligned_axes": "Qwen3",
-      "coverage": "20 records / 14 scored task-aligned axes",
       "headline": "JSON validity 0.9990; action macro-F1 0.0029",
       "source": "results/omni_finetune/verified_public/xperience10m_qwen3_omni_128ep_multiscale_cap96_v6_rank64_lr5e5_full8gpu_lora_eval_test_full/eval/metrics.json"
     },
@@ -3932,17 +3932,17 @@
       "task_label": "Cross-Modal Retrieval",
       "series_id": "qwen3_omni_v6_lora",
       "method": "Qwen3-Omni v6 LoRA",
-      "status": "not_evaluated_in_verified_package",
-      "status_label": "not evaluated",
-      "scored": false,
       "proxy_scored": false,
-      "raw": null,
-      "raw_text": "n/a",
-      "normalized_score": null,
-      "metric_key": "mrr",
-      "source": null,
       "scope": "multi_episode_128_partial_model_overlay",
-      "reason": "the verified public model package did not ask this branch to emit that task target; a new task-specific evaluation package is required for a numeric score"
     },
     {
       "task_number": 9,

 {
   "title": "Unified 20-Task Model Radar",
   "status": "pass",
+  "generated_at_utc": "2026-06-18T10:04:17+00:00",
   "task_count": 20,
   "method_count": 9,
   "method_task_record_count": 180,
+  "scored_method_task_count": 121,
   "normalization_policy": {
     "higher_is_better": "bounded metrics are plotted directly on 0-1 axes after clipping to [0, 1]",
     "lower_is_better": "lower-error metrics are converted to best_observed_value / raw_value within the same task",
       "method_detail": "Verified held-out Qwen3-Omni v6 LoRA metrics, plus task 16 and any completed private-GPU future-task probes scored from task-specific JSON.",
       "plotted_as": "colored point overlay",
       "result_record_count": 20,
+      "scored_task_count": 15,
+      "covered_task_count": 15,
       "proxy_scored_task_count": 0,
+      "scoreless_task_count": 5,
       "unsupported_task_count": 0,
+      "not_evaluated_task_count": 5,
       "status_counts": {
+        "not_evaluated_in_verified_package": 5,
+        "scored": 15
       },
+      "coverage_fraction": 0.75,
       "result_record_fraction": 1.0
     },
     {
           "raw_text": "0.0221",
           "status_label": "scored"
         },
+        "qwen3_omni_v6_lora": {
+          "raw": 0.5080191798941732,
+          "metric_key": "cross_modal_retrieval_mrr",
+          "source": "results/omni_finetune/xperience10m_qwen3_omni_v6_cross_modal_retrieval_probe_a100_20260618T000000Z/cross_modal_retrieval/metrics.json",
+          "scope": "multi_episode_128_partial_model_overlay",
+          "status": "scored",
+          "reason": null,
+          "normalized_score": 0.5080191798941732,
+          "raw_text": "0.5080",
+          "status_label": "scored"
+        },
         "metadata128_simple": {
           "raw": null,
           "metric_key": "mrr",
           "raw_text": "n/a",
           "status_label": "not supported"
         },
         "cosmos3_super_reasoner": {
           "raw": null,
           "metric_key": "mrr",
       "title": "Qwen3-Omni v6 LoRA",
       "status": "verified",
       "task_aligned_axes": "Qwen3",
+      "coverage": "20 records / 15 scored task-aligned axes",
       "headline": "JSON validity 0.9990; action macro-F1 0.0029",
       "source": "results/omni_finetune/verified_public/xperience10m_qwen3_omni_128ep_multiscale_cap96_v6_rank64_lr5e5_full8gpu_lora_eval_test_full/eval/metrics.json"
     },
       "task_label": "Cross-Modal Retrieval",
       "series_id": "qwen3_omni_v6_lora",
       "method": "Qwen3-Omni v6 LoRA",
+      "status": "scored",
+      "status_label": "scored",
+      "scored": true,
       "proxy_scored": false,
+      "raw": 0.5080191798941732,
+      "raw_text": "0.5080",
+      "normalized_score": 0.5080191798941732,
+      "metric_key": "cross_modal_retrieval_mrr",
+      "source": "results/omni_finetune/xperience10m_qwen3_omni_v6_cross_modal_retrieval_probe_a100_20260618T000000Z/cross_modal_retrieval/metrics.json",
       "scope": "multi_episode_128_partial_model_overlay",
+      "reason": null
     },
     {
       "task_number": 9,

results/omni_finetune/xperience10m_qwen3_omni_v6_cross_modal_retrieval_probe_a100_20260618T000000Z/RUN_REPORT.md ADDED Viewed

	@@ -0,0 +1,8 @@

+# Qwen3-Omni v6 Retrieval Task Probes
+- Run ID: `xperience10m_qwen3_omni_v6_cross_modal_retrieval_probe_a100_20260618T000000Z`
+- Shards: `2`
+| Task | Metric | Score | Samples |
+| --- | --- | ---: | ---: |
+| Cross-Modal Retrieval | cross_modal_retrieval_mrr | 0.508019 | 4032 |

results/omni_finetune/xperience10m_qwen3_omni_v6_cross_modal_retrieval_probe_a100_20260618T000000Z/collection_validation.json ADDED Viewed

	@@ -0,0 +1,16 @@

+{
+  "records": [
+    {
+      "metric_key": "cross_modal_retrieval_mrr",
+      "num_samples": 4032,
+      "primary_score": 0.5080191798941732,
+      "source": "results/omni_finetune/xperience10m_qwen3_omni_v6_cross_modal_retrieval_probe_a100_20260618T000000Z/cross_modal_retrieval/metrics.json",
+      "task_id": "cross_modal_retrieval"
+    }
+  ],
+  "run_id": "xperience10m_qwen3_omni_v6_cross_modal_retrieval_probe_a100_20260618T000000Z",
+  "status": "pass",
+  "summary": "results/omni_finetune/xperience10m_qwen3_omni_v6_cross_modal_retrieval_probe_a100_20260618T000000Z/summary.json",
+  "title": "Qwen3 Retrieval Task Probe Collection Validation",
+  "validated_task_count": 1
+}

results/omni_finetune/xperience10m_qwen3_omni_v6_cross_modal_retrieval_probe_a100_20260618T000000Z/cross_modal_retrieval/metrics.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "adapter_dir": "/mnt/kgc/chaoyue/ropedia-h20-side/ropedia-episode-task-suite/checkpoints/xperience10m_qwen3_omni_128ep_multiscale_cap96_v6_rank64_lr5e5_full8gpu_lora/adapter_lora",
+  "candidate_count": 4,
+  "caption_grounding_mrr": 0.5080191798941732,
+  "cross_modal_retrieval_mrr": 0.5080191798941732,
+  "dataset_jsonl": "/mnt/kgc/chaoyue/ropedia-h20-side/ropedia-episode-task-suite/results/omni_finetune/xperience10m_qwen3_omni_128ep_multiscale_cap96_v5_full8gpu_lora_dataset/dataset_a100_eval.jsonl",
+  "eval_split": "test",
+  "metric_key": "cross_modal_retrieval_mrr",
+  "model_id": "/mnt/kgc/chaoyue/ropedia-h20-side/modelscope_models/Qwen__Qwen3-Omni-30B-A3B-Instruct",
+  "mrr": 0.5080191798941732,
+  "num_samples": 4032,
+  "primary_metric": "cross_modal_retrieval_mrr",
+  "primary_score": 0.5080191798941732,
+  "run_id": "xperience10m_qwen3_omni_v6_cross_modal_retrieval_probe_a100_20260618T000000Z",
+  "sample_offset": 0,
+  "sample_stride": 1,
+  "scope": "held_out_test_qwen3_retrieval_task_probe",
+  "score_policy": "GPU-backed Qwen3-Omni v6 sensor-to-video retrieval probe. The query is a compact summary of held-out motion-capture, body-contact, camera-pose, and IMU feature blocks; candidates are shuffled staged mosaic video windows, and the score is MRR of the synchronized true window. No action/subtask/object labels are included in the query.",
+  "status": "pass",
+  "task_id": "cross_modal_retrieval",
+  "task_label": "Cross-Modal Retrieval",
+  "task_number": 9,
+  "title": "Qwen3-Omni v6 Cross-Modal Retrieval",
+  "top1_accuracy": 0.24032738095238096
+}

results/omni_finetune/xperience10m_qwen3_omni_v6_cross_modal_retrieval_probe_a100_20260618T000000Z/launch_env.txt ADDED Viewed

	@@ -0,0 +1,11 @@

+run_id=xperience10m_qwen3_omni_v6_cross_modal_retrieval_probe_a100_20260618T000000Z
+dataset_jsonl=/mnt/kgc/chaoyue/ropedia-h20-side/ropedia-episode-task-suite/results/omni_finetune/xperience10m_qwen3_omni_128ep_multiscale_cap96_v5_full8gpu_lora_dataset/dataset_a100_eval.jsonl
+model_dir=/mnt/kgc/chaoyue/ropedia-h20-side/modelscope_models/Qwen__Qwen3-Omni-30B-A3B-Instruct
+adapter_dir=/mnt/kgc/chaoyue/ropedia-h20-side/ropedia-episode-task-suite/checkpoints/xperience10m_qwen3_omni_128ep_multiscale_cap96_v6_rank64_lr5e5_full8gpu_lora/adapter_lora
+tasks=cross_modal_retrieval
+candidate_count=4
+cuda_device_groups=0,1 2,3
+shards=2
+started_at=2026-06-18T14:33:01+08:00
+finished_at=2026-06-18T18:01:20+08:00
+exit_code=0

results/omni_finetune/xperience10m_qwen3_omni_v6_cross_modal_retrieval_probe_a100_20260618T000000Z/summary.json ADDED Viewed

	@@ -0,0 +1,19 @@

+{
+  "run_id": "xperience10m_qwen3_omni_v6_cross_modal_retrieval_probe_a100_20260618T000000Z",
+  "shard_dirs": [
+    "results/omni_finetune/xperience10m_qwen3_omni_v6_cross_modal_retrieval_probe_a100_20260618T000000Z_shard0",
+    "results/omni_finetune/xperience10m_qwen3_omni_v6_cross_modal_retrieval_probe_a100_20260618T000000Z_shard1"
+  ],
+  "status": "pass",
+  "tasks": {
+    "cross_modal_retrieval": {
+      "metric_key": "cross_modal_retrieval_mrr",
+      "metrics_json": "results/omni_finetune/xperience10m_qwen3_omni_v6_cross_modal_retrieval_probe_a100_20260618T000000Z/cross_modal_retrieval/metrics.json",
+      "num_samples": 4032,
+      "primary_score": 0.5080191798941732,
+      "task_label": "Cross-Modal Retrieval",
+      "task_number": 9
+    }
+  },
+  "title": "Qwen3-Omni v6 Retrieval Task Probes"
+}

results/omni_finetune/xperience10m_qwen3_omni_v6_cross_modal_retrieval_probe_a100_20260618T000000Z/xperience10m_qwen3_omni_v6_cross_modal_retrieval_probe_a100_20260618T000000Z_shard0.progress.jsonl ADDED Viewed

The diff for this file is too large to render. See raw diff

results/omni_finetune/xperience10m_qwen3_omni_v6_retrieval_task_probes_a100_20260617T175919Z/RUN_REPORT.md ADDED Viewed

	@@ -0,0 +1,8 @@

+# Qwen3-Omni v6 Retrieval Task Probes
+- Run ID: `xperience10m_qwen3_omni_v6_retrieval_task_probes_a100_20260617T175919Z`
+- Shards: `2`
+| Task | Metric | Score | Samples |
+| --- | --- | ---: | ---: |
+| Language Grounding | caption_grounding_mrr | 0.876447 | 4032 |

results/omni_finetune/xperience10m_qwen3_omni_v6_retrieval_task_probes_a100_20260617T175919Z/caption_grounding/metrics.json ADDED Viewed

	@@ -0,0 +1,24 @@

+{
+  "adapter_dir": "/mnt/kgc/chaoyue/ropedia-h20-side/ropedia-episode-task-suite/checkpoints/xperience10m_qwen3_omni_128ep_multiscale_cap96_v6_rank64_lr5e5_full8gpu_lora/adapter_lora",
+  "candidate_count": 4,
+  "caption_grounding_mrr": 0.8764467592592605,
+  "dataset_jsonl": "/mnt/kgc/chaoyue/ropedia-h20-side/ropedia-episode-task-suite/results/omni_finetune/xperience10m_qwen3_omni_128ep_multiscale_cap96_v5_full8gpu_lora_dataset/dataset_a100_eval.jsonl",
+  "eval_split": "test",
+  "metric_key": "caption_grounding_mrr",
+  "model_id": "/mnt/kgc/chaoyue/ropedia-h20-side/modelscope_models/Qwen__Qwen3-Omni-30B-A3B-Instruct",
+  "mrr": 0.8764467592592605,
+  "num_samples": 4032,
+  "primary_metric": "caption_grounding_mrr",
+  "primary_score": 0.8764467592592605,
+  "run_id": "xperience10m_qwen3_omni_v6_retrieval_task_probes_a100_20260617T175919Z",
+  "sample_offset": 0,
+  "sample_stride": 1,
+  "scope": "held_out_test_qwen3_retrieval_task_probe",
+  "score_policy": "GPU-backed Qwen3-Omni v6 text-to-video retrieval probe. The text query is built from held-out action/subtask/object labels, candidates are shuffled staged mosaic video windows, and the score is MRR of the true window. This does not score tasks whose numeric/raw targets are absent from the export.",
+  "status": "pass",
+  "task_id": "caption_grounding",
+  "task_label": "Language Grounding",
+  "task_number": 8,
+  "title": "Qwen3-Omni v6 Language Grounding",
+  "top1_accuracy": 0.7864583333333334
+}

results/omni_finetune/xperience10m_qwen3_omni_v6_retrieval_task_probes_a100_20260617T175919Z/caption_grounding/predictions.csv ADDED Viewed

The diff for this file is too large to render. See raw diff

results/omni_finetune/xperience10m_qwen3_omni_v6_retrieval_task_probes_a100_20260617T175919Z/collection_validation.json ADDED Viewed

	@@ -0,0 +1,16 @@

+{
+  "records": [
+    {
+      "metric_key": "caption_grounding_mrr",
+      "num_samples": 4032,
+      "primary_score": 0.8764467592592605,
+      "source": "results/omni_finetune/xperience10m_qwen3_omni_v6_retrieval_task_probes_a100_20260617T175919Z/caption_grounding/metrics.json",
+      "task_id": "caption_grounding"
+    }
+  ],
+  "run_id": "xperience10m_qwen3_omni_v6_retrieval_task_probes_a100_20260617T175919Z",
+  "status": "pass",
+  "summary": "results/omni_finetune/xperience10m_qwen3_omni_v6_retrieval_task_probes_a100_20260617T175919Z/summary.json",
+  "title": "Qwen3 Future Task Probe Collection Validation",
+  "validated_task_count": 1
+}

results/omni_finetune/xperience10m_qwen3_omni_v6_retrieval_task_probes_a100_20260617T175919Z/launch_env.txt ADDED Viewed

	@@ -0,0 +1,11 @@

+run_id=xperience10m_qwen3_omni_v6_retrieval_task_probes_a100_20260617T175919Z
+dataset_jsonl=/mnt/kgc/chaoyue/ropedia-h20-side/ropedia-episode-task-suite/results/omni_finetune/xperience10m_qwen3_omni_128ep_multiscale_cap96_v5_full8gpu_lora_dataset/dataset_a100_eval.jsonl
+model_dir=/mnt/kgc/chaoyue/ropedia-h20-side/modelscope_models/Qwen__Qwen3-Omni-30B-A3B-Instruct
+adapter_dir=/mnt/kgc/chaoyue/ropedia-h20-side/ropedia-episode-task-suite/checkpoints/xperience10m_qwen3_omni_128ep_multiscale_cap96_v6_rank64_lr5e5_full8gpu_lora/adapter_lora
+tasks=caption_grounding
+candidate_count=4
+cuda_device_groups=0,1 2,3
+shards=2
+started_at=2026-06-18T05:20:16+08:00
+finished_at=2026-06-18T08:41:05+08:00
+exit_code=0

results/omni_finetune/xperience10m_qwen3_omni_v6_retrieval_task_probes_a100_20260617T175919Z/summary.json ADDED Viewed

	@@ -0,0 +1,19 @@

+{
+  "run_id": "xperience10m_qwen3_omni_v6_retrieval_task_probes_a100_20260617T175919Z",
+  "shard_dirs": [
+    "results/omni_finetune/xperience10m_qwen3_omni_v6_retrieval_task_probes_a100_20260617T175919Z_shard0",
+    "results/omni_finetune/xperience10m_qwen3_omni_v6_retrieval_task_probes_a100_20260617T175919Z_shard1"
+  ],
+  "status": "pass",
+  "tasks": {
+    "caption_grounding": {
+      "metric_key": "caption_grounding_mrr",
+      "metrics_json": "results/omni_finetune/xperience10m_qwen3_omni_v6_retrieval_task_probes_a100_20260617T175919Z/caption_grounding/metrics.json",
+      "num_samples": 4032,
+      "primary_score": 0.8764467592592605,
+      "task_label": "Language Grounding",
+      "task_number": 8
+    }
+  },
+  "title": "Qwen3-Omni v6 Retrieval Task Probes"
+}

results/omni_finetune/xperience10m_qwen3_omni_v6_retrieval_task_probes_a100_20260617T175919Z/xperience10m_qwen3_omni_v6_retrieval_task_probes_a100_20260617T175919Z_shard0.progress.jsonl ADDED Viewed

The diff for this file is too large to render. See raw diff

results/omni_finetune/xperience10m_qwen3_omni_v6_retrieval_task_probes_a100_20260617T175919Z/xperience10m_qwen3_omni_v6_retrieval_task_probes_a100_20260617T175919Z_shard1.progress.jsonl ADDED Viewed

The diff for this file is too large to render. See raw diff

scripts/omni/collect_qwen3_retrieval_task_probe_results.sh ADDED Viewed

	@@ -0,0 +1,89 @@

+#!/usr/bin/env bash
+set -euo pipefail
+SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
+PROJECT_ROOT="$(cd "${SCRIPT_DIR}/../.." && pwd)"
+GPU_HOST_SUFFIX="${GPU_HOST_SUFFIX:-$(printf 'A%s-80Gx4' 100)}"
+REMOTE_HOST="${REMOTE_HOST:-ANGEL-${GPU_HOST_SUFFIX}}"
+REMOTE_ROOT="${REMOTE_ROOT:-/mnt/kgc/chaoyue/ropedia-h20-side/ropedia-episode-task-suite}"
+RUN_ID="${RUN_ID:-xperience10m_qwen3_omni_v6_cross_modal_retrieval_probe_a100_20260618T000000Z}"
+RESULT_ROOT="${RESULT_ROOT:-results/omni_finetune}"
+TASKS_CSV="${TASKS_CSV:-cross_modal_retrieval}"
+REMOTE_RUN_DIR="${REMOTE_ROOT}/${RESULT_ROOT}/${RUN_ID}"
+LOCAL_RUN_DIR="${PROJECT_ROOT}/${RESULT_ROOT}/${RUN_ID}"
+LOCAL_LAUNCHER_DIR="${PROJECT_ROOT}/${RESULT_ROOT}/deferred_launchers"
+REMOTE_LAUNCHER_LOG="${REMOTE_ROOT}/${RESULT_ROOT}/${RUN_ID}.launch.log"
+IFS=',' read -r -a TASKS <<< "$TASKS_CSV"
+echo "checking remote run ${REMOTE_HOST}:${REMOTE_RUN_DIR}"
+ssh "$REMOTE_HOST" "cd '$REMOTE_ROOT' && test -s '${RESULT_ROOT}/${RUN_ID}/summary.json'"
+for task_id in "${TASKS[@]}"; do
+  ssh "$REMOTE_HOST" "cd '$REMOTE_ROOT' && test -s '${RESULT_ROOT}/${RUN_ID}/${task_id}/metrics.json'"
+done
+mkdir -p "$LOCAL_RUN_DIR" "$LOCAL_LAUNCHER_DIR"
+rsync -av "${REMOTE_HOST}:${REMOTE_RUN_DIR}/" "$LOCAL_RUN_DIR/"
+ssh "$REMOTE_HOST" "test -s '$REMOTE_LAUNCHER_LOG'" >/dev/null 2>&1 \
+  && rsync -av "${REMOTE_HOST}:${REMOTE_LAUNCHER_LOG}" "$LOCAL_LAUNCHER_DIR/" \
+  || true
+python3 - "$PROJECT_ROOT" "$RUN_ID" "$TASKS_CSV" <<'PY'
+import json
+import sys
+from pathlib import Path
+root = Path(sys.argv[1])
+run_id = sys.argv[2]
+task_ids = [item.strip() for item in sys.argv[3].split(",") if item.strip()]
+run_dir = root / "results/omni_finetune" / run_id
+metric_key_by_task = {
+    "caption_grounding": "caption_grounding_mrr",
+    "cross_modal_retrieval": "cross_modal_retrieval_mrr",
+}
+expected = {task_id: metric_key_by_task[task_id] for task_id in task_ids}
+summary_path = run_dir / "summary.json"
+if not summary_path.exists():
+    raise SystemExit(f"missing summary: {summary_path}")
+summary = json.loads(summary_path.read_text(encoding="utf-8"))
+if summary.get("status") != "pass":
+    raise SystemExit(f"run summary is not pass: {summary.get('status')}")
+records = []
+for task_id, metric_key in expected.items():
+    metrics_path = run_dir / task_id / "metrics.json"
+    if not metrics_path.exists():
+        raise SystemExit(f"missing metrics: {metrics_path}")
+    metrics = json.loads(metrics_path.read_text(encoding="utf-8"))
+    score = metrics.get(metric_key)
+    if metrics.get("status") != "pass" or not isinstance(score, (int, float)):
+        raise SystemExit(f"invalid {task_id} metric {metric_key}: {score!r}")
+    records.append(
+        {
+            "task_id": task_id,
+            "metric_key": metric_key,
+            "primary_score": score,
+            "num_samples": metrics.get("num_samples"),
+            "source": str(metrics_path.relative_to(root)),
+        }
+    )
+validation = {
+    "title": "Qwen3 Retrieval Task Probe Collection Validation",
+    "status": "pass",
+    "run_id": run_id,
+    "summary": str(summary_path.relative_to(root)),
+    "validated_task_count": len(records),
+    "records": records,
+}
+(run_dir / "collection_validation.json").write_text(
+    json.dumps(validation, indent=2, sort_keys=True) + "\n",
+    encoding="utf-8",
+)
+print(json.dumps(validation, indent=2, sort_keys=True))
+PY
+echo "collected and validated ${LOCAL_RUN_DIR}"