cy0307 commited on
Commit
f61ea5b
·
verified ·
1 Parent(s): 942c6d8

Update 145-result docs data

Browse files
docs/data/artifact_index.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
  "title": "Ropedia Xperience-10M Task Suite Artifact Index",
3
- "generated_at_utc": "2026-06-18T14:33:19+00:00",
4
  "status": "pass",
5
  "artifact_count": 213,
6
  "missing": [],
@@ -599,7 +599,7 @@
599
  "shows": "Machine-readable source-alignment pass/fail check for repo, website, and HF surfaces.",
600
  "exists": true,
601
  "bytes": 4432,
602
- "sha256": "8d92c5a61bfc4dd1b21330cce7da6fc76be2aeb333ed0396589cbceb053f2c2c"
603
  },
604
  {
605
  "id": "source_alignment_validator",
@@ -719,8 +719,8 @@
719
  "surface": "website_hf",
720
  "shows": "Stores normalized 20-axis radar values, raw task metrics, Qwen3/Cosmos overlay mappings, branch-card caveats, and explicit scoreless status records.",
721
  "exists": true,
722
- "bytes": 229355,
723
- "sha256": "f25fca45a1b418122a0bcb2bd37376639102385c2faf0b464013bfa2ab52c54e"
724
  },
725
  {
726
  "id": "single_episode_task_model_radar_json",
@@ -731,7 +731,7 @@
731
  "shows": "Machine-readable split radar for the one-episode Minimal and Neural MLP baselines, both scored on all 20 task contracts.",
732
  "exists": true,
733
  "bytes": 51064,
734
- "sha256": "2f508b484058116acb3d485a5c53847ac07b710a8f99e599a51433346997bdfd"
735
  },
736
  {
737
  "id": "episode128_task_model_radar_json",
@@ -741,8 +741,8 @@
741
  "surface": "website_hf",
742
  "shows": "Machine-readable split radar for selected 128-episode metadata/raw baselines and verified Qwen3/Cosmos branches, preserving explicit scoreless cells.",
743
  "exists": true,
744
- "bytes": 185503,
745
- "sha256": "32ba033a12e0da3a4cb5a2ae427fe6a78830f9af21b4a5f9c4c4fc6e44087303"
746
  },
747
  {
748
  "id": "task_method_20_result_matrix_json",
@@ -752,8 +752,8 @@
752
  "surface": "website_hf",
753
  "shows": "Machine-readable 9-method by 20-task matrix where every method has 20 records and scoreless cells carry unsupported/not-evaluated reasons.",
754
  "exists": true,
755
- "bytes": 128856,
756
- "sha256": "90fb4a25420b03c473ca790fc286ea11117fb26ea6c084a8c288663041cba503"
757
  },
758
  {
759
  "id": "task_method_20_result_matrix",
@@ -763,8 +763,8 @@
763
  "surface": "repo_hf",
764
  "shows": "Reader-facing table that separates 20 records per method from numeric scored axes, documented raw128 proxy scores, unsupported metadata targets, and model targets not evaluated in verified packages.",
765
  "exists": true,
766
- "bytes": 3946,
767
- "sha256": "b166f6362dfed5ce4b0619f8c65853a1795ff9d65c47200825658ec725d7616d"
768
  },
769
  {
770
  "id": "task_method_20_gap_audit_json",
@@ -774,8 +774,8 @@
774
  "surface": "website_hf",
775
  "shows": "Machine-readable 180-record gap ledger with numeric scores, scoreless cells, explicit status reasons, and next evidence needed before new scores can be published.",
776
  "exists": true,
777
- "bytes": 35121,
778
- "sha256": "9724eb26b9243729b7aab6062745244f856d6004185cc70cb19fa8c11fc609c6"
779
  },
780
  {
781
  "id": "task_method_20_gap_audit",
@@ -785,8 +785,8 @@
785
  "surface": "repo_hf",
786
  "shows": "Reader-facing ledger that lists every scoreless method-task cell and the concrete target or model-output evidence required before it can become numeric.",
787
  "exists": true,
788
- "bytes": 10094,
789
- "sha256": "d4590c09e18344db280965ba7de38a2531fc3bc8d72fa8ee7cdfcd61928461dd"
790
  },
791
  {
792
  "id": "unified_task_model_radar_chart",
@@ -796,8 +796,8 @@
796
  "surface": "website_hf",
797
  "shows": "Compares minimal and neural MLP baselines across all 20 tasks, with Qwen3/Cosmos task-aligned model overlays.",
798
  "exists": true,
799
- "bytes": 53899,
800
- "sha256": "6a72bfb7f2415ea88dd5c60ae6efce67e0296da3fa859b17cbda7692d4817fe4"
801
  },
802
  {
803
  "id": "single_episode_task_model_radar_chart",
@@ -818,8 +818,8 @@
818
  "surface": "website_hf",
819
  "shows": "Separates the selected 128-episode methods: raw-feature simple/NN as complete 20/20 scored polygons and metadata/Qwen/Cosmos as task-aligned overlays.",
820
  "exists": true,
821
- "bytes": 47886,
822
- "sha256": "486d477a2c7eff2a3c51f20a55bb069b53e0a6529ec8d305a32cecb3536a6bdc"
823
  },
824
  {
825
  "id": "unified_task_model_radar_builder",
@@ -829,8 +829,8 @@
829
  "surface": "repo_hf",
830
  "shows": "Regenerates the direction-aware radar chart and machine-readable metric overlay JSON.",
831
  "exists": true,
832
- "bytes": 53250,
833
- "sha256": "cedb6a0ef284b8809c9fc9a256e3b5d411e19431b3dcb7629c104c32a573c5f3"
834
  },
835
  {
836
  "id": "task_method_20_gap_audit_builder",
@@ -884,8 +884,8 @@
884
  "surface": "repo_hf",
885
  "shows": "Scores task 16 action-object relation only where verified held-out prediction JSON already contains action and object-set fields.",
886
  "exists": true,
887
- "bytes": 2830,
888
- "sha256": "7313cc227e570e7a71e245f75c14da3df9c005e5f048fd82696d852b1bf2d2f3"
889
  },
890
  {
891
  "id": "existing_model_output_task_probe_script",
@@ -895,8 +895,8 @@
895
  "surface": "repo_hf",
896
  "shows": "Derives task-specific scores from committed verified model outputs without running new inference or backfilling absent targets.",
897
  "exists": true,
898
- "bytes": 20580,
899
- "sha256": "7b23192c05f214219e24a8774de96da990b26cc6abf35c8994938a73934c8163"
900
  },
901
  {
902
  "id": "a100_128_metadata_task_baselines",
@@ -1105,7 +1105,7 @@
1105
  "shows": "Machine-readable release-check summary for validators, mirrors, and public project surfaces.",
1106
  "exists": true,
1107
  "bytes": 8100,
1108
- "sha256": "2c24d43a2062ce9a242ca39bf27beac84380b96f0f0e0825a40fec60e5c488e7"
1109
  },
1110
  {
1111
  "id": "public_surface_qa",
@@ -1286,7 +1286,7 @@
1286
  "volatile": true,
1287
  "shows": "Confirms public bundles exclude raw data, caches, heavy archives, and credential text.",
1288
  "exists": true,
1289
- "bytes": 9598,
1290
  "hash_policy": "existence_and_size_only"
1291
  },
1292
  {
@@ -1310,7 +1310,7 @@
1310
  "volatile": true,
1311
  "shows": "Confirms prepared GitHub/HF Space/artifact/model mirrors share the same critical data, figure, website HTML, and validator files.",
1312
  "exists": true,
1313
- "bytes": 1102386,
1314
  "hash_policy": "existence_and_size_only"
1315
  },
1316
  {
 
1
  {
2
  "title": "Ropedia Xperience-10M Task Suite Artifact Index",
3
+ "generated_at_utc": "2026-06-18T15:28:15+00:00",
4
  "status": "pass",
5
  "artifact_count": 213,
6
  "missing": [],
 
599
  "shows": "Machine-readable source-alignment pass/fail check for repo, website, and HF surfaces.",
600
  "exists": true,
601
  "bytes": 4432,
602
+ "sha256": "dddcbc30a5a4ccd134317fd35bf0e15b5103981ac09bd3359794c55e3a3dbacb"
603
  },
604
  {
605
  "id": "source_alignment_validator",
 
719
  "surface": "website_hf",
720
  "shows": "Stores normalized 20-axis radar values, raw task metrics, Qwen3/Cosmos overlay mappings, branch-card caveats, and explicit scoreless status records.",
721
  "exists": true,
722
+ "bytes": 229332,
723
+ "sha256": "34bccb1afa3dc987a98e774c55b00e23d4345d69b3dca3fd124ef64bde0c3d34"
724
  },
725
  {
726
  "id": "single_episode_task_model_radar_json",
 
731
  "shows": "Machine-readable split radar for the one-episode Minimal and Neural MLP baselines, both scored on all 20 task contracts.",
732
  "exists": true,
733
  "bytes": 51064,
734
+ "sha256": "ca48852ee62c58d83ff9fed7f775a3babb07653aab00a2b4266ea9885cbc45ff"
735
  },
736
  {
737
  "id": "episode128_task_model_radar_json",
 
741
  "surface": "website_hf",
742
  "shows": "Machine-readable split radar for selected 128-episode metadata/raw baselines and verified Qwen3/Cosmos branches, preserving explicit scoreless cells.",
743
  "exists": true,
744
+ "bytes": 185480,
745
+ "sha256": "52250951319a87a069bfca26338a1daa1511a2bd4bb145801e5e44d230dcac1c"
746
  },
747
  {
748
  "id": "task_method_20_result_matrix_json",
 
752
  "surface": "website_hf",
753
  "shows": "Machine-readable 9-method by 20-task matrix where every method has 20 records and scoreless cells carry unsupported/not-evaluated reasons.",
754
  "exists": true,
755
+ "bytes": 128862,
756
+ "sha256": "7d071dd9d840025d566d430f7c24f7005f8c8d4acb73d14fbbd5df754e996f70"
757
  },
758
  {
759
  "id": "task_method_20_result_matrix",
 
763
  "surface": "repo_hf",
764
  "shows": "Reader-facing table that separates 20 records per method from numeric scored axes, documented raw128 proxy scores, unsupported metadata targets, and model targets not evaluated in verified packages.",
765
  "exists": true,
766
+ "bytes": 3938,
767
+ "sha256": "b15ca4161fc6aa94e5f452b14d802b37d80d565bbf64a795dfdaeef07e5263de"
768
  },
769
  {
770
  "id": "task_method_20_gap_audit_json",
 
774
  "surface": "website_hf",
775
  "shows": "Machine-readable 180-record gap ledger with numeric scores, scoreless cells, explicit status reasons, and next evidence needed before new scores can be published.",
776
  "exists": true,
777
+ "bytes": 34384,
778
+ "sha256": "ec64d78e07d4951f14832945668b1c2252a61393672e3d607478e7d6f95ccf99"
779
  },
780
  {
781
  "id": "task_method_20_gap_audit",
 
785
  "surface": "repo_hf",
786
  "shows": "Reader-facing ledger that lists every scoreless method-task cell and the concrete target or model-output evidence required before it can become numeric.",
787
  "exists": true,
788
+ "bytes": 9908,
789
+ "sha256": "6b76d3cb4294150c5322b0af6c22fe52ed658d31b87a646fa26a54322d6a55e2"
790
  },
791
  {
792
  "id": "unified_task_model_radar_chart",
 
796
  "surface": "website_hf",
797
  "shows": "Compares minimal and neural MLP baselines across all 20 tasks, with Qwen3/Cosmos task-aligned model overlays.",
798
  "exists": true,
799
+ "bytes": 54032,
800
+ "sha256": "56893b66dfb07f3028844fe96846614715058b808c731ce870232ad6247a3a50"
801
  },
802
  {
803
  "id": "single_episode_task_model_radar_chart",
 
818
  "surface": "website_hf",
819
  "shows": "Separates the selected 128-episode methods: raw-feature simple/NN as complete 20/20 scored polygons and metadata/Qwen/Cosmos as task-aligned overlays.",
820
  "exists": true,
821
+ "bytes": 48019,
822
+ "sha256": "70fb20c3f8f9574303b5e4832fba7b5e39ae20b75aa006af53ac1457b7daf64e"
823
  },
824
  {
825
  "id": "unified_task_model_radar_builder",
 
829
  "surface": "repo_hf",
830
  "shows": "Regenerates the direction-aware radar chart and machine-readable metric overlay JSON.",
831
  "exists": true,
832
+ "bytes": 53705,
833
+ "sha256": "e35607dd679ce7c199868660cd733e1e67c6877e2c5f207de15e9738483af0dc"
834
  },
835
  {
836
  "id": "task_method_20_gap_audit_builder",
 
884
  "surface": "repo_hf",
885
  "shows": "Scores task 16 action-object relation only where verified held-out prediction JSON already contains action and object-set fields.",
886
  "exists": true,
887
+ "bytes": 3180,
888
+ "sha256": "82a36cc5d23fa34792eac6b7124eecbed900d52c8f0b2a7921d409e236efd68a"
889
  },
890
  {
891
  "id": "existing_model_output_task_probe_script",
 
895
  "surface": "repo_hf",
896
  "shows": "Derives task-specific scores from committed verified model outputs without running new inference or backfilling absent targets.",
897
  "exists": true,
898
+ "bytes": 27917,
899
+ "sha256": "421c50262c38dd222ab0c5f50d78f4d92ee18f13b9a96661b292c44c05e89b1d"
900
  },
901
  {
902
  "id": "a100_128_metadata_task_baselines",
 
1105
  "shows": "Machine-readable release-check summary for validators, mirrors, and public project surfaces.",
1106
  "exists": true,
1107
  "bytes": 8100,
1108
+ "sha256": "b83cc28e9ae1843761e5a15ca34d1b9468749d6d2dd740313e26148aaca92357"
1109
  },
1110
  {
1111
  "id": "public_surface_qa",
 
1286
  "volatile": true,
1287
  "shows": "Confirms public bundles exclude raw data, caches, heavy archives, and credential text.",
1288
  "exists": true,
1289
+ "bytes": 9520,
1290
  "hash_policy": "existence_and_size_only"
1291
  },
1292
  {
 
1310
  "volatile": true,
1311
  "shows": "Confirms prepared GitHub/HF Space/artifact/model mirrors share the same critical data, figure, website HTML, and validator files.",
1312
  "exists": true,
1313
+ "bytes": 919718,
1314
  "hash_policy": "existence_and_size_only"
1315
  },
1316
  {
docs/data/episode128_task_model_radar.json CHANGED
@@ -1,12 +1,12 @@
1
  {
2
  "title": "128-Episode 20-Task Radar",
3
  "status": "pass",
4
- "generated_at_utc": "2026-06-18T14:32:46+00:00",
5
  "description": "Selected 128-episode metadata/raw baselines plus verified Qwen3/Cosmos branches. Every method has 20 records; numeric scores appear only where the public artifact produced that task target.",
6
  "task_count": 20,
7
  "method_count": 7,
8
  "method_task_record_count": 140,
9
- "scored_method_task_count": 104,
10
  "normalization_policy": {
11
  "higher_is_better": "bounded metrics are plotted directly on 0-1 axes after clipping to [0, 1]",
12
  "lower_is_better": "lower-error metrics are converted to best_observed_value / raw_value within the same task",
@@ -147,20 +147,20 @@
147
  "kind": "partial_128_episode_foundation_model_overlay",
148
  "scope": "128 selected episodes, held-out test",
149
  "stroke_dasharray": "4 7",
150
- "method_detail": "Verified Cosmos3-Super base-weight Reasoner JSON-task evaluation, plus task 16 scored from existing verified action/object JSON.",
151
  "plotted_as": "colored point overlay",
152
  "result_record_count": 20,
153
- "scored_task_count": 7,
154
- "covered_task_count": 7,
155
  "proxy_scored_task_count": 0,
156
- "scoreless_task_count": 13,
157
  "unsupported_task_count": 0,
158
- "not_evaluated_task_count": 13,
159
  "status_counts": {
160
- "not_evaluated_in_verified_package": 13,
161
- "scored": 7
162
  },
163
- "coverage_fraction": 0.35,
164
  "result_record_fraction": 1.0
165
  },
166
  {
@@ -1986,15 +1986,15 @@
1986
  "status_label": "scored"
1987
  },
1988
  "cosmos3_super_reasoner": {
1989
- "raw": null,
1990
- "metric_key": "mae",
1991
- "source": null,
1992
  "scope": "multi_episode_128_partial_model_overlay",
1993
- "status": "not_evaluated_in_verified_package",
1994
- "reason": "the verified public model package did not ask this branch to emit that task target; a new task-specific evaluation package is required for a numeric score",
1995
- "normalized_score": null,
1996
- "raw_text": "n/a",
1997
- "status_label": "not evaluated"
1998
  },
1999
  "cosmos3_nano_future_window": {
2000
  "raw": null,
@@ -4501,17 +4501,17 @@
4501
  "task_label": "Time-to-Next-Transition Regression",
4502
  "series_id": "cosmos3_super_reasoner",
4503
  "method": "Cosmos3-Super Reasoner",
4504
- "status": "not_evaluated_in_verified_package",
4505
- "status_label": "not evaluated",
4506
- "scored": false,
4507
  "proxy_scored": false,
4508
- "raw": null,
4509
- "raw_text": "n/a",
4510
- "normalized_score": null,
4511
- "metric_key": "mae",
4512
- "source": null,
4513
  "scope": "multi_episode_128_partial_model_overlay",
4514
- "reason": "the verified public model package did not ask this branch to emit that task target; a new task-specific evaluation package is required for a numeric score"
4515
  },
4516
  {
4517
  "task_number": 20,
 
1
  {
2
  "title": "128-Episode 20-Task Radar",
3
  "status": "pass",
4
+ "generated_at_utc": "2026-06-18T15:27:21+00:00",
5
  "description": "Selected 128-episode metadata/raw baselines plus verified Qwen3/Cosmos branches. Every method has 20 records; numeric scores appear only where the public artifact produced that task target.",
6
  "task_count": 20,
7
  "method_count": 7,
8
  "method_task_record_count": 140,
9
+ "scored_method_task_count": 105,
10
  "normalization_policy": {
11
  "higher_is_better": "bounded metrics are plotted directly on 0-1 axes after clipping to [0, 1]",
12
  "lower_is_better": "lower-error metrics are converted to best_observed_value / raw_value within the same task",
 
147
  "kind": "partial_128_episode_foundation_model_overlay",
148
  "scope": "128 selected episodes, held-out test",
149
  "stroke_dasharray": "4 7",
150
+ "method_detail": "Verified Cosmos3-Super base-weight Reasoner JSON-task evaluation, plus task 16 and a derived task-20 action-boundary timing probe scored from existing verified JSON.",
151
  "plotted_as": "colored point overlay",
152
  "result_record_count": 20,
153
+ "scored_task_count": 8,
154
+ "covered_task_count": 8,
155
  "proxy_scored_task_count": 0,
156
+ "scoreless_task_count": 12,
157
  "unsupported_task_count": 0,
158
+ "not_evaluated_task_count": 12,
159
  "status_counts": {
160
+ "not_evaluated_in_verified_package": 12,
161
+ "scored": 8
162
  },
163
+ "coverage_fraction": 0.4,
164
  "result_record_fraction": 1.0
165
  },
166
  {
 
1986
  "status_label": "scored"
1987
  },
1988
  "cosmos3_super_reasoner": {
1989
+ "raw": 52.94642857142857,
1990
+ "metric_key": "time_to_transition_mae",
1991
+ "source": "results/omni_finetune/model_output_task_probes_20260616/time_to_transition/cosmos3_super_reasoner/metrics.json",
1992
  "scope": "multi_episode_128_partial_model_overlay",
1993
+ "status": "scored",
1994
+ "reason": null,
1995
+ "normalized_score": 0.19901920981190058,
1996
+ "raw_text": "52.95",
1997
+ "status_label": "scored"
1998
  },
1999
  "cosmos3_nano_future_window": {
2000
  "raw": null,
 
4501
  "task_label": "Time-to-Next-Transition Regression",
4502
  "series_id": "cosmos3_super_reasoner",
4503
  "method": "Cosmos3-Super Reasoner",
4504
+ "status": "scored",
4505
+ "status_label": "scored",
4506
+ "scored": true,
4507
  "proxy_scored": false,
4508
+ "raw": 52.94642857142857,
4509
+ "raw_text": "52.95",
4510
+ "normalized_score": 0.19901920981190058,
4511
+ "metric_key": "time_to_transition_mae",
4512
+ "source": "results/omni_finetune/model_output_task_probes_20260616/time_to_transition/cosmos3_super_reasoner/metrics.json",
4513
  "scope": "multi_episode_128_partial_model_overlay",
4514
+ "reason": null
4515
  },
4516
  {
4517
  "task_number": 20,
docs/data/mirror_parity.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "status": "pass",
3
- "generated_at_utc": "2026-06-18T14:59:22+00:00",
4
  "hf_root": "hf_publish",
5
  "summary": {
6
- "group_count": 756,
7
  "failure_count": 0,
8
  "failures_by_surface": {}
9
  },
@@ -138,45 +138,45 @@
138
  "local": {
139
  "path": "repo:docs/data/artifact_index.json",
140
  "exists": true,
141
- "bytes": 116111,
142
- "sha256": "a227be29b220c1c9bc2438f979f29e0aac635d82f13cffef2b0e0016c300a179"
143
  },
144
  "mirrors": {
145
  "hf_space": {
146
  "path": "hf_space:data/artifact_index.json",
147
  "exists": true,
148
- "bytes": 116111,
149
- "sha256": "a227be29b220c1c9bc2438f979f29e0aac635d82f13cffef2b0e0016c300a179"
150
  },
151
  "hf_artifacts_data": {
152
  "path": "hf_artifacts:data/artifact_index.json",
153
  "exists": true,
154
- "bytes": 116111,
155
- "sha256": "a227be29b220c1c9bc2438f979f29e0aac635d82f13cffef2b0e0016c300a179"
156
  },
157
  "hf_artifacts": {
158
  "path": "hf_artifacts:docs/data/artifact_index.json",
159
  "exists": true,
160
- "bytes": 116111,
161
- "sha256": "a227be29b220c1c9bc2438f979f29e0aac635d82f13cffef2b0e0016c300a179"
162
  },
163
  "hf_model_data": {
164
  "path": "hf_model:data/artifact_index.json",
165
  "exists": true,
166
- "bytes": 116111,
167
- "sha256": "a227be29b220c1c9bc2438f979f29e0aac635d82f13cffef2b0e0016c300a179"
168
  },
169
  "hf_model_docs_data": {
170
  "path": "hf_model:docs/data/artifact_index.json",
171
  "exists": true,
172
- "bytes": 116111,
173
- "sha256": "a227be29b220c1c9bc2438f979f29e0aac635d82f13cffef2b0e0016c300a179"
174
  },
175
  "hf_model": {
176
  "path": "hf_model:metrics/artifact_index.json",
177
  "exists": true,
178
- "bytes": 116111,
179
- "sha256": "a227be29b220c1c9bc2438f979f29e0aac635d82f13cffef2b0e0016c300a179"
180
  }
181
  },
182
  "failures": []
@@ -923,44 +923,44 @@
923
  "path": "repo:docs/data/publication_audit.json",
924
  "exists": true,
925
  "bytes": 9520,
926
- "sha256": "23261bd9b51b9cd9e0df8460422e4da9c291a4c354bdb42a34577c386d827173"
927
  },
928
  "mirrors": {
929
  "hf_space": {
930
  "path": "hf_space:data/publication_audit.json",
931
  "exists": true,
932
  "bytes": 9520,
933
- "sha256": "23261bd9b51b9cd9e0df8460422e4da9c291a4c354bdb42a34577c386d827173"
934
  },
935
  "hf_artifacts_data": {
936
  "path": "hf_artifacts:data/publication_audit.json",
937
  "exists": true,
938
  "bytes": 9520,
939
- "sha256": "23261bd9b51b9cd9e0df8460422e4da9c291a4c354bdb42a34577c386d827173"
940
  },
941
  "hf_artifacts": {
942
  "path": "hf_artifacts:docs/data/publication_audit.json",
943
  "exists": true,
944
  "bytes": 9520,
945
- "sha256": "23261bd9b51b9cd9e0df8460422e4da9c291a4c354bdb42a34577c386d827173"
946
  },
947
  "hf_model_data": {
948
  "path": "hf_model:data/publication_audit.json",
949
  "exists": true,
950
  "bytes": 9520,
951
- "sha256": "23261bd9b51b9cd9e0df8460422e4da9c291a4c354bdb42a34577c386d827173"
952
  },
953
  "hf_model_docs_data": {
954
  "path": "hf_model:docs/data/publication_audit.json",
955
  "exists": true,
956
  "bytes": 9520,
957
- "sha256": "23261bd9b51b9cd9e0df8460422e4da9c291a4c354bdb42a34577c386d827173"
958
  },
959
  "hf_model": {
960
  "path": "hf_model:metrics/publication_audit.json",
961
  "exists": true,
962
  "bytes": 9520,
963
- "sha256": "23261bd9b51b9cd9e0df8460422e4da9c291a4c354bdb42a34577c386d827173"
964
  }
965
  },
966
  "failures": []
@@ -972,44 +972,44 @@
972
  "path": "repo:docs/data/public_surface_qa.json",
973
  "exists": true,
974
  "bytes": 7126,
975
- "sha256": "86550c6f3eb1c21fae26eb259d0713d6ec81629e23fd301660a35aef8ab277bf"
976
  },
977
  "mirrors": {
978
  "hf_space": {
979
  "path": "hf_space:data/public_surface_qa.json",
980
  "exists": true,
981
  "bytes": 7126,
982
- "sha256": "86550c6f3eb1c21fae26eb259d0713d6ec81629e23fd301660a35aef8ab277bf"
983
  },
984
  "hf_artifacts_data": {
985
  "path": "hf_artifacts:data/public_surface_qa.json",
986
  "exists": true,
987
  "bytes": 7126,
988
- "sha256": "86550c6f3eb1c21fae26eb259d0713d6ec81629e23fd301660a35aef8ab277bf"
989
  },
990
  "hf_artifacts": {
991
  "path": "hf_artifacts:docs/data/public_surface_qa.json",
992
  "exists": true,
993
  "bytes": 7126,
994
- "sha256": "86550c6f3eb1c21fae26eb259d0713d6ec81629e23fd301660a35aef8ab277bf"
995
  },
996
  "hf_model_data": {
997
  "path": "hf_model:data/public_surface_qa.json",
998
  "exists": true,
999
  "bytes": 7126,
1000
- "sha256": "86550c6f3eb1c21fae26eb259d0713d6ec81629e23fd301660a35aef8ab277bf"
1001
  },
1002
  "hf_model_docs_data": {
1003
  "path": "hf_model:docs/data/public_surface_qa.json",
1004
  "exists": true,
1005
  "bytes": 7126,
1006
- "sha256": "86550c6f3eb1c21fae26eb259d0713d6ec81629e23fd301660a35aef8ab277bf"
1007
  },
1008
  "hf_model": {
1009
  "path": "hf_model:metrics/public_surface_qa.json",
1010
  "exists": true,
1011
  "bytes": 7126,
1012
- "sha256": "86550c6f3eb1c21fae26eb259d0713d6ec81629e23fd301660a35aef8ab277bf"
1013
  }
1014
  },
1015
  "failures": []
@@ -1119,44 +1119,44 @@
1119
  "path": "repo:docs/data/quality_gates.json",
1120
  "exists": true,
1121
  "bytes": 8100,
1122
- "sha256": "ab3abda98791d4fea4af45e0d68ed8c203951ad17429ac2e3c022cc0afdd9ccb"
1123
  },
1124
  "mirrors": {
1125
  "hf_space": {
1126
  "path": "hf_space:data/quality_gates.json",
1127
  "exists": true,
1128
  "bytes": 8100,
1129
- "sha256": "ab3abda98791d4fea4af45e0d68ed8c203951ad17429ac2e3c022cc0afdd9ccb"
1130
  },
1131
  "hf_artifacts_data": {
1132
  "path": "hf_artifacts:data/quality_gates.json",
1133
  "exists": true,
1134
  "bytes": 8100,
1135
- "sha256": "ab3abda98791d4fea4af45e0d68ed8c203951ad17429ac2e3c022cc0afdd9ccb"
1136
  },
1137
  "hf_artifacts": {
1138
  "path": "hf_artifacts:docs/data/quality_gates.json",
1139
  "exists": true,
1140
  "bytes": 8100,
1141
- "sha256": "ab3abda98791d4fea4af45e0d68ed8c203951ad17429ac2e3c022cc0afdd9ccb"
1142
  },
1143
  "hf_model_data": {
1144
  "path": "hf_model:data/quality_gates.json",
1145
  "exists": true,
1146
  "bytes": 8100,
1147
- "sha256": "ab3abda98791d4fea4af45e0d68ed8c203951ad17429ac2e3c022cc0afdd9ccb"
1148
  },
1149
  "hf_model_docs_data": {
1150
  "path": "hf_model:docs/data/quality_gates.json",
1151
  "exists": true,
1152
  "bytes": 8100,
1153
- "sha256": "ab3abda98791d4fea4af45e0d68ed8c203951ad17429ac2e3c022cc0afdd9ccb"
1154
  },
1155
  "hf_model": {
1156
  "path": "hf_model:metrics/quality_gates.json",
1157
  "exists": true,
1158
  "bytes": 8100,
1159
- "sha256": "ab3abda98791d4fea4af45e0d68ed8c203951ad17429ac2e3c022cc0afdd9ccb"
1160
  }
1161
  },
1162
  "failures": []
@@ -1658,44 +1658,44 @@
1658
  "path": "repo:docs/data/source_alignment_audit.json",
1659
  "exists": true,
1660
  "bytes": 4432,
1661
- "sha256": "dddcbc30a5a4ccd134317fd35bf0e15b5103981ac09bd3359794c55e3a3dbacb"
1662
  },
1663
  "mirrors": {
1664
  "hf_space": {
1665
  "path": "hf_space:data/source_alignment_audit.json",
1666
  "exists": true,
1667
  "bytes": 4432,
1668
- "sha256": "dddcbc30a5a4ccd134317fd35bf0e15b5103981ac09bd3359794c55e3a3dbacb"
1669
  },
1670
  "hf_artifacts_data": {
1671
  "path": "hf_artifacts:data/source_alignment_audit.json",
1672
  "exists": true,
1673
  "bytes": 4432,
1674
- "sha256": "dddcbc30a5a4ccd134317fd35bf0e15b5103981ac09bd3359794c55e3a3dbacb"
1675
  },
1676
  "hf_artifacts": {
1677
  "path": "hf_artifacts:docs/data/source_alignment_audit.json",
1678
  "exists": true,
1679
  "bytes": 4432,
1680
- "sha256": "dddcbc30a5a4ccd134317fd35bf0e15b5103981ac09bd3359794c55e3a3dbacb"
1681
  },
1682
  "hf_model_data": {
1683
  "path": "hf_model:data/source_alignment_audit.json",
1684
  "exists": true,
1685
  "bytes": 4432,
1686
- "sha256": "dddcbc30a5a4ccd134317fd35bf0e15b5103981ac09bd3359794c55e3a3dbacb"
1687
  },
1688
  "hf_model_docs_data": {
1689
  "path": "hf_model:docs/data/source_alignment_audit.json",
1690
  "exists": true,
1691
  "bytes": 4432,
1692
- "sha256": "dddcbc30a5a4ccd134317fd35bf0e15b5103981ac09bd3359794c55e3a3dbacb"
1693
  },
1694
  "hf_model": {
1695
  "path": "hf_model:metrics/source_alignment_audit.json",
1696
  "exists": true,
1697
  "bytes": 4432,
1698
- "sha256": "dddcbc30a5a4ccd134317fd35bf0e15b5103981ac09bd3359794c55e3a3dbacb"
1699
  }
1700
  },
1701
  "failures": []
@@ -1756,44 +1756,44 @@
1756
  "path": "repo:docs/data/single_episode_task_model_radar.json",
1757
  "exists": true,
1758
  "bytes": 51064,
1759
- "sha256": "2f508b484058116acb3d485a5c53847ac07b710a8f99e599a51433346997bdfd"
1760
  },
1761
  "mirrors": {
1762
  "hf_space": {
1763
  "path": "hf_space:data/single_episode_task_model_radar.json",
1764
  "exists": true,
1765
  "bytes": 51064,
1766
- "sha256": "2f508b484058116acb3d485a5c53847ac07b710a8f99e599a51433346997bdfd"
1767
  },
1768
  "hf_artifacts_data": {
1769
  "path": "hf_artifacts:data/single_episode_task_model_radar.json",
1770
  "exists": true,
1771
  "bytes": 51064,
1772
- "sha256": "2f508b484058116acb3d485a5c53847ac07b710a8f99e599a51433346997bdfd"
1773
  },
1774
  "hf_artifacts": {
1775
  "path": "hf_artifacts:docs/data/single_episode_task_model_radar.json",
1776
  "exists": true,
1777
  "bytes": 51064,
1778
- "sha256": "2f508b484058116acb3d485a5c53847ac07b710a8f99e599a51433346997bdfd"
1779
  },
1780
  "hf_model_data": {
1781
  "path": "hf_model:data/single_episode_task_model_radar.json",
1782
  "exists": true,
1783
  "bytes": 51064,
1784
- "sha256": "2f508b484058116acb3d485a5c53847ac07b710a8f99e599a51433346997bdfd"
1785
  },
1786
  "hf_model_docs_data": {
1787
  "path": "hf_model:docs/data/single_episode_task_model_radar.json",
1788
  "exists": true,
1789
  "bytes": 51064,
1790
- "sha256": "2f508b484058116acb3d485a5c53847ac07b710a8f99e599a51433346997bdfd"
1791
  },
1792
  "hf_model": {
1793
  "path": "hf_model:metrics/single_episode_task_model_radar.json",
1794
  "exists": true,
1795
  "bytes": 51064,
1796
- "sha256": "2f508b484058116acb3d485a5c53847ac07b710a8f99e599a51433346997bdfd"
1797
  }
1798
  },
1799
  "failures": []
@@ -1804,45 +1804,45 @@
1804
  "local": {
1805
  "path": "repo:docs/data/episode128_task_model_radar.json",
1806
  "exists": true,
1807
- "bytes": 185503,
1808
- "sha256": "32ba033a12e0da3a4cb5a2ae427fe6a78830f9af21b4a5f9c4c4fc6e44087303"
1809
  },
1810
  "mirrors": {
1811
  "hf_space": {
1812
  "path": "hf_space:data/episode128_task_model_radar.json",
1813
  "exists": true,
1814
- "bytes": 185503,
1815
- "sha256": "32ba033a12e0da3a4cb5a2ae427fe6a78830f9af21b4a5f9c4c4fc6e44087303"
1816
  },
1817
  "hf_artifacts_data": {
1818
  "path": "hf_artifacts:data/episode128_task_model_radar.json",
1819
  "exists": true,
1820
- "bytes": 185503,
1821
- "sha256": "32ba033a12e0da3a4cb5a2ae427fe6a78830f9af21b4a5f9c4c4fc6e44087303"
1822
  },
1823
  "hf_artifacts": {
1824
  "path": "hf_artifacts:docs/data/episode128_task_model_radar.json",
1825
  "exists": true,
1826
- "bytes": 185503,
1827
- "sha256": "32ba033a12e0da3a4cb5a2ae427fe6a78830f9af21b4a5f9c4c4fc6e44087303"
1828
  },
1829
  "hf_model_data": {
1830
  "path": "hf_model:data/episode128_task_model_radar.json",
1831
  "exists": true,
1832
- "bytes": 185503,
1833
- "sha256": "32ba033a12e0da3a4cb5a2ae427fe6a78830f9af21b4a5f9c4c4fc6e44087303"
1834
  },
1835
  "hf_model_docs_data": {
1836
  "path": "hf_model:docs/data/episode128_task_model_radar.json",
1837
  "exists": true,
1838
- "bytes": 185503,
1839
- "sha256": "32ba033a12e0da3a4cb5a2ae427fe6a78830f9af21b4a5f9c4c4fc6e44087303"
1840
  },
1841
  "hf_model": {
1842
  "path": "hf_model:metrics/episode128_task_model_radar.json",
1843
  "exists": true,
1844
- "bytes": 185503,
1845
- "sha256": "32ba033a12e0da3a4cb5a2ae427fe6a78830f9af21b4a5f9c4c4fc6e44087303"
1846
  }
1847
  },
1848
  "failures": []
@@ -2001,44 +2001,44 @@
2001
  "path": "repo:docs/data/task_surface_integrity.json",
2002
  "exists": true,
2003
  "bytes": 45779,
2004
- "sha256": "9073c4a4424b519ae50a1a9761b4e25bf7fd12c5c9e0cd5ff528473157e17c9f"
2005
  },
2006
  "mirrors": {
2007
  "hf_space": {
2008
  "path": "hf_space:data/task_surface_integrity.json",
2009
  "exists": true,
2010
  "bytes": 45779,
2011
- "sha256": "9073c4a4424b519ae50a1a9761b4e25bf7fd12c5c9e0cd5ff528473157e17c9f"
2012
  },
2013
  "hf_artifacts_data": {
2014
  "path": "hf_artifacts:data/task_surface_integrity.json",
2015
  "exists": true,
2016
  "bytes": 45779,
2017
- "sha256": "9073c4a4424b519ae50a1a9761b4e25bf7fd12c5c9e0cd5ff528473157e17c9f"
2018
  },
2019
  "hf_artifacts": {
2020
  "path": "hf_artifacts:docs/data/task_surface_integrity.json",
2021
  "exists": true,
2022
  "bytes": 45779,
2023
- "sha256": "9073c4a4424b519ae50a1a9761b4e25bf7fd12c5c9e0cd5ff528473157e17c9f"
2024
  },
2025
  "hf_model_data": {
2026
  "path": "hf_model:data/task_surface_integrity.json",
2027
  "exists": true,
2028
  "bytes": 45779,
2029
- "sha256": "9073c4a4424b519ae50a1a9761b4e25bf7fd12c5c9e0cd5ff528473157e17c9f"
2030
  },
2031
  "hf_model_docs_data": {
2032
  "path": "hf_model:docs/data/task_surface_integrity.json",
2033
  "exists": true,
2034
  "bytes": 45779,
2035
- "sha256": "9073c4a4424b519ae50a1a9761b4e25bf7fd12c5c9e0cd5ff528473157e17c9f"
2036
  },
2037
  "hf_model": {
2038
  "path": "hf_model:metrics/task_surface_integrity.json",
2039
  "exists": true,
2040
  "bytes": 45779,
2041
- "sha256": "9073c4a4424b519ae50a1a9761b4e25bf7fd12c5c9e0cd5ff528473157e17c9f"
2042
  }
2043
  },
2044
  "failures": []
@@ -2098,45 +2098,45 @@
2098
  "local": {
2099
  "path": "repo:docs/data/task_method_20_result_matrix.json",
2100
  "exists": true,
2101
- "bytes": 128856,
2102
- "sha256": "90fb4a25420b03c473ca790fc286ea11117fb26ea6c084a8c288663041cba503"
2103
  },
2104
  "mirrors": {
2105
  "hf_space": {
2106
  "path": "hf_space:data/task_method_20_result_matrix.json",
2107
  "exists": true,
2108
- "bytes": 128856,
2109
- "sha256": "90fb4a25420b03c473ca790fc286ea11117fb26ea6c084a8c288663041cba503"
2110
  },
2111
  "hf_artifacts_data": {
2112
  "path": "hf_artifacts:data/task_method_20_result_matrix.json",
2113
  "exists": true,
2114
- "bytes": 128856,
2115
- "sha256": "90fb4a25420b03c473ca790fc286ea11117fb26ea6c084a8c288663041cba503"
2116
  },
2117
  "hf_artifacts": {
2118
  "path": "hf_artifacts:docs/data/task_method_20_result_matrix.json",
2119
  "exists": true,
2120
- "bytes": 128856,
2121
- "sha256": "90fb4a25420b03c473ca790fc286ea11117fb26ea6c084a8c288663041cba503"
2122
  },
2123
  "hf_model_data": {
2124
  "path": "hf_model:data/task_method_20_result_matrix.json",
2125
  "exists": true,
2126
- "bytes": 128856,
2127
- "sha256": "90fb4a25420b03c473ca790fc286ea11117fb26ea6c084a8c288663041cba503"
2128
  },
2129
  "hf_model_docs_data": {
2130
  "path": "hf_model:docs/data/task_method_20_result_matrix.json",
2131
  "exists": true,
2132
- "bytes": 128856,
2133
- "sha256": "90fb4a25420b03c473ca790fc286ea11117fb26ea6c084a8c288663041cba503"
2134
  },
2135
  "hf_model": {
2136
  "path": "hf_model:metrics/task_method_20_result_matrix.json",
2137
  "exists": true,
2138
- "bytes": 128856,
2139
- "sha256": "90fb4a25420b03c473ca790fc286ea11117fb26ea6c084a8c288663041cba503"
2140
  }
2141
  },
2142
  "failures": []
@@ -2147,45 +2147,45 @@
2147
  "local": {
2148
  "path": "repo:docs/data/task_method_20_gap_audit.json",
2149
  "exists": true,
2150
- "bytes": 35121,
2151
- "sha256": "9724eb26b9243729b7aab6062745244f856d6004185cc70cb19fa8c11fc609c6"
2152
  },
2153
  "mirrors": {
2154
  "hf_space": {
2155
  "path": "hf_space:data/task_method_20_gap_audit.json",
2156
  "exists": true,
2157
- "bytes": 35121,
2158
- "sha256": "9724eb26b9243729b7aab6062745244f856d6004185cc70cb19fa8c11fc609c6"
2159
  },
2160
  "hf_artifacts_data": {
2161
  "path": "hf_artifacts:data/task_method_20_gap_audit.json",
2162
  "exists": true,
2163
- "bytes": 35121,
2164
- "sha256": "9724eb26b9243729b7aab6062745244f856d6004185cc70cb19fa8c11fc609c6"
2165
  },
2166
  "hf_artifacts": {
2167
  "path": "hf_artifacts:docs/data/task_method_20_gap_audit.json",
2168
  "exists": true,
2169
- "bytes": 35121,
2170
- "sha256": "9724eb26b9243729b7aab6062745244f856d6004185cc70cb19fa8c11fc609c6"
2171
  },
2172
  "hf_model_data": {
2173
  "path": "hf_model:data/task_method_20_gap_audit.json",
2174
  "exists": true,
2175
- "bytes": 35121,
2176
- "sha256": "9724eb26b9243729b7aab6062745244f856d6004185cc70cb19fa8c11fc609c6"
2177
  },
2178
  "hf_model_docs_data": {
2179
  "path": "hf_model:docs/data/task_method_20_gap_audit.json",
2180
  "exists": true,
2181
- "bytes": 35121,
2182
- "sha256": "9724eb26b9243729b7aab6062745244f856d6004185cc70cb19fa8c11fc609c6"
2183
  },
2184
  "hf_model": {
2185
  "path": "hf_model:metrics/task_method_20_gap_audit.json",
2186
  "exists": true,
2187
- "bytes": 35121,
2188
- "sha256": "9724eb26b9243729b7aab6062745244f856d6004185cc70cb19fa8c11fc609c6"
2189
  }
2190
  },
2191
  "failures": []
@@ -2245,45 +2245,45 @@
2245
  "local": {
2246
  "path": "repo:docs/data/unified_task_model_radar.json",
2247
  "exists": true,
2248
- "bytes": 229355,
2249
- "sha256": "f25fca45a1b418122a0bcb2bd37376639102385c2faf0b464013bfa2ab52c54e"
2250
  },
2251
  "mirrors": {
2252
  "hf_space": {
2253
  "path": "hf_space:data/unified_task_model_radar.json",
2254
  "exists": true,
2255
- "bytes": 229355,
2256
- "sha256": "f25fca45a1b418122a0bcb2bd37376639102385c2faf0b464013bfa2ab52c54e"
2257
  },
2258
  "hf_artifacts_data": {
2259
  "path": "hf_artifacts:data/unified_task_model_radar.json",
2260
  "exists": true,
2261
- "bytes": 229355,
2262
- "sha256": "f25fca45a1b418122a0bcb2bd37376639102385c2faf0b464013bfa2ab52c54e"
2263
  },
2264
  "hf_artifacts": {
2265
  "path": "hf_artifacts:docs/data/unified_task_model_radar.json",
2266
  "exists": true,
2267
- "bytes": 229355,
2268
- "sha256": "f25fca45a1b418122a0bcb2bd37376639102385c2faf0b464013bfa2ab52c54e"
2269
  },
2270
  "hf_model_data": {
2271
  "path": "hf_model:data/unified_task_model_radar.json",
2272
  "exists": true,
2273
- "bytes": 229355,
2274
- "sha256": "f25fca45a1b418122a0bcb2bd37376639102385c2faf0b464013bfa2ab52c54e"
2275
  },
2276
  "hf_model_docs_data": {
2277
  "path": "hf_model:docs/data/unified_task_model_radar.json",
2278
  "exists": true,
2279
- "bytes": 229355,
2280
- "sha256": "f25fca45a1b418122a0bcb2bd37376639102385c2faf0b464013bfa2ab52c54e"
2281
  },
2282
  "hf_model": {
2283
  "path": "hf_model:metrics/unified_task_model_radar.json",
2284
  "exists": true,
2285
- "bytes": 229355,
2286
- "sha256": "f25fca45a1b418122a0bcb2bd37376639102385c2faf0b464013bfa2ab52c54e"
2287
  }
2288
  },
2289
  "failures": []
@@ -2294,45 +2294,45 @@
2294
  "local": {
2295
  "path": "repo:docs/data/website_integrity.json",
2296
  "exists": true,
2297
- "bytes": 20022,
2298
- "sha256": "5e123f9e4592beb38c3c4b908cd18a9bb4d737cf4be70309b0d94742e9fefdde"
2299
  },
2300
  "mirrors": {
2301
  "hf_space": {
2302
  "path": "hf_space:data/website_integrity.json",
2303
  "exists": true,
2304
- "bytes": 20022,
2305
- "sha256": "5e123f9e4592beb38c3c4b908cd18a9bb4d737cf4be70309b0d94742e9fefdde"
2306
  },
2307
  "hf_artifacts_data": {
2308
  "path": "hf_artifacts:data/website_integrity.json",
2309
  "exists": true,
2310
- "bytes": 20022,
2311
- "sha256": "5e123f9e4592beb38c3c4b908cd18a9bb4d737cf4be70309b0d94742e9fefdde"
2312
  },
2313
  "hf_artifacts": {
2314
  "path": "hf_artifacts:docs/data/website_integrity.json",
2315
  "exists": true,
2316
- "bytes": 20022,
2317
- "sha256": "5e123f9e4592beb38c3c4b908cd18a9bb4d737cf4be70309b0d94742e9fefdde"
2318
  },
2319
  "hf_model_data": {
2320
  "path": "hf_model:data/website_integrity.json",
2321
  "exists": true,
2322
- "bytes": 20022,
2323
- "sha256": "5e123f9e4592beb38c3c4b908cd18a9bb4d737cf4be70309b0d94742e9fefdde"
2324
  },
2325
  "hf_model_docs_data": {
2326
  "path": "hf_model:docs/data/website_integrity.json",
2327
  "exists": true,
2328
- "bytes": 20022,
2329
- "sha256": "5e123f9e4592beb38c3c4b908cd18a9bb4d737cf4be70309b0d94742e9fefdde"
2330
  },
2331
  "hf_model": {
2332
  "path": "hf_model:metrics/website_integrity.json",
2333
  "exists": true,
2334
- "bytes": 20022,
2335
- "sha256": "5e123f9e4592beb38c3c4b908cd18a9bb4d737cf4be70309b0d94742e9fefdde"
2336
  }
2337
  },
2338
  "failures": []
@@ -2515,33 +2515,33 @@
2515
  "local": {
2516
  "path": "repo:docs/assets/charts/episode128_task_model_radar.svg",
2517
  "exists": true,
2518
- "bytes": 47886,
2519
- "sha256": "486d477a2c7eff2a3c51f20a55bb069b53e0a6529ec8d305a32cecb3536a6bdc"
2520
  },
2521
  "mirrors": {
2522
  "hf_space": {
2523
  "path": "hf_space:assets/charts/episode128_task_model_radar.svg",
2524
  "exists": true,
2525
- "bytes": 47886,
2526
- "sha256": "486d477a2c7eff2a3c51f20a55bb069b53e0a6529ec8d305a32cecb3536a6bdc"
2527
  },
2528
  "hf_artifacts_docs": {
2529
  "path": "hf_artifacts:docs/assets/charts/episode128_task_model_radar.svg",
2530
  "exists": true,
2531
- "bytes": 47886,
2532
- "sha256": "486d477a2c7eff2a3c51f20a55bb069b53e0a6529ec8d305a32cecb3536a6bdc"
2533
  },
2534
  "hf_artifacts_card": {
2535
  "path": "hf_artifacts:assets/charts/episode128_task_model_radar.svg",
2536
  "exists": true,
2537
- "bytes": 47886,
2538
- "sha256": "486d477a2c7eff2a3c51f20a55bb069b53e0a6529ec8d305a32cecb3536a6bdc"
2539
  },
2540
  "hf_model": {
2541
  "path": "hf_model:assets/charts/episode128_task_model_radar.svg",
2542
  "exists": true,
2543
- "bytes": 47886,
2544
- "sha256": "486d477a2c7eff2a3c51f20a55bb069b53e0a6529ec8d305a32cecb3536a6bdc"
2545
  }
2546
  },
2547
  "failures": []
@@ -2589,33 +2589,33 @@
2589
  "local": {
2590
  "path": "repo:docs/assets/charts/unified_task_model_radar.svg",
2591
  "exists": true,
2592
- "bytes": 53899,
2593
- "sha256": "6a72bfb7f2415ea88dd5c60ae6efce67e0296da3fa859b17cbda7692d4817fe4"
2594
  },
2595
  "mirrors": {
2596
  "hf_space": {
2597
  "path": "hf_space:assets/charts/unified_task_model_radar.svg",
2598
  "exists": true,
2599
- "bytes": 53899,
2600
- "sha256": "6a72bfb7f2415ea88dd5c60ae6efce67e0296da3fa859b17cbda7692d4817fe4"
2601
  },
2602
  "hf_artifacts_docs": {
2603
  "path": "hf_artifacts:docs/assets/charts/unified_task_model_radar.svg",
2604
  "exists": true,
2605
- "bytes": 53899,
2606
- "sha256": "6a72bfb7f2415ea88dd5c60ae6efce67e0296da3fa859b17cbda7692d4817fe4"
2607
  },
2608
  "hf_artifacts_card": {
2609
  "path": "hf_artifacts:assets/charts/unified_task_model_radar.svg",
2610
  "exists": true,
2611
- "bytes": 53899,
2612
- "sha256": "6a72bfb7f2415ea88dd5c60ae6efce67e0296da3fa859b17cbda7692d4817fe4"
2613
  },
2614
  "hf_model": {
2615
  "path": "hf_model:assets/charts/unified_task_model_radar.svg",
2616
  "exists": true,
2617
- "bytes": 53899,
2618
- "sha256": "6a72bfb7f2415ea88dd5c60ae6efce67e0296da3fa859b17cbda7692d4817fe4"
2619
  }
2620
  },
2621
  "failures": []
@@ -4472,21 +4472,21 @@
4472
  "local": {
4473
  "path": "repo:scripts/omni/score_existing_model_output_task_probes.py",
4474
  "exists": true,
4475
- "bytes": 20580,
4476
- "sha256": "7b23192c05f214219e24a8774de96da990b26cc6abf35c8994938a73934c8163"
4477
  },
4478
  "mirrors": {
4479
  "hf_artifacts": {
4480
  "path": "hf_artifacts:scripts/omni/score_existing_model_output_task_probes.py",
4481
  "exists": true,
4482
- "bytes": 20580,
4483
- "sha256": "7b23192c05f214219e24a8774de96da990b26cc6abf35c8994938a73934c8163"
4484
  },
4485
  "hf_model": {
4486
  "path": "hf_model:scripts/omni/score_existing_model_output_task_probes.py",
4487
  "exists": true,
4488
- "bytes": 20580,
4489
- "sha256": "7b23192c05f214219e24a8774de96da990b26cc6abf35c8994938a73934c8163"
4490
  }
4491
  },
4492
  "failures": []
@@ -4997,21 +4997,21 @@
4997
  "local": {
4998
  "path": "repo:scripts/build_unified_task_model_radar.py",
4999
  "exists": true,
5000
- "bytes": 53250,
5001
- "sha256": "cedb6a0ef284b8809c9fc9a256e3b5d411e19431b3dcb7629c104c32a573c5f3"
5002
  },
5003
  "mirrors": {
5004
  "hf_artifacts": {
5005
  "path": "hf_artifacts:scripts/build_unified_task_model_radar.py",
5006
  "exists": true,
5007
- "bytes": 53250,
5008
- "sha256": "cedb6a0ef284b8809c9fc9a256e3b5d411e19431b3dcb7629c104c32a573c5f3"
5009
  },
5010
  "hf_model": {
5011
  "path": "hf_model:scripts/build_unified_task_model_radar.py",
5012
  "exists": true,
5013
- "bytes": 53250,
5014
- "sha256": "cedb6a0ef284b8809c9fc9a256e3b5d411e19431b3dcb7629c104c32a573c5f3"
5015
  }
5016
  },
5017
  "failures": []
@@ -5427,38 +5427,38 @@
5427
  "path": "repo:docs/index.html",
5428
  "exists": true,
5429
  "bytes": 254705,
5430
- "sha256": "0dc5781b35fbf5ae2064bb830f2a7471990ab09fcb8bced20ca9dea6fe863b16"
5431
  },
5432
  "mirrors": {
5433
  "hf_space": {
5434
  "path": "hf_space:index.html",
5435
  "exists": true,
5436
  "bytes": 254705,
5437
- "sha256": "0dc5781b35fbf5ae2064bb830f2a7471990ab09fcb8bced20ca9dea6fe863b16"
5438
  },
5439
  "hf_artifacts_root": {
5440
  "path": "hf_artifacts:index.html",
5441
  "exists": true,
5442
  "bytes": 254705,
5443
- "sha256": "0dc5781b35fbf5ae2064bb830f2a7471990ab09fcb8bced20ca9dea6fe863b16"
5444
  },
5445
  "hf_artifacts_docs": {
5446
  "path": "hf_artifacts:docs/index.html",
5447
  "exists": true,
5448
  "bytes": 254705,
5449
- "sha256": "0dc5781b35fbf5ae2064bb830f2a7471990ab09fcb8bced20ca9dea6fe863b16"
5450
  },
5451
  "hf_model": {
5452
  "path": "hf_model:index.html",
5453
  "exists": true,
5454
  "bytes": 254705,
5455
- "sha256": "0dc5781b35fbf5ae2064bb830f2a7471990ab09fcb8bced20ca9dea6fe863b16"
5456
  },
5457
  "hf_model_docs": {
5458
  "path": "hf_model:docs/index.html",
5459
  "exists": true,
5460
  "bytes": 254705,
5461
- "sha256": "0dc5781b35fbf5ae2064bb830f2a7471990ab09fcb8bced20ca9dea6fe863b16"
5462
  }
5463
  },
5464
  "failures": []
@@ -12498,21 +12498,21 @@
12498
  "local": {
12499
  "path": "repo:results/omni_finetune/model_output_task_probes_20260616/RUN_REPORT.md",
12500
  "exists": true,
12501
- "bytes": 1138,
12502
- "sha256": "c29bcc33b88b3a338fa6713e3744f4489bcfce1e0fbaea866942a4c892dda9b1"
12503
  },
12504
  "mirrors": {
12505
  "hf_artifacts": {
12506
  "path": "hf_artifacts:results/omni_finetune/model_output_task_probes_20260616/RUN_REPORT.md",
12507
  "exists": true,
12508
- "bytes": 1138,
12509
- "sha256": "c29bcc33b88b3a338fa6713e3744f4489bcfce1e0fbaea866942a4c892dda9b1"
12510
  },
12511
  "hf_model": {
12512
  "path": "hf_model:results/omni_finetune/model_output_task_probes_20260616/RUN_REPORT.md",
12513
  "exists": true,
12514
- "bytes": 1138,
12515
- "sha256": "c29bcc33b88b3a338fa6713e3744f4489bcfce1e0fbaea866942a4c892dda9b1"
12516
  }
12517
  },
12518
  "failures": []
@@ -12524,20 +12524,20 @@
12524
  "path": "repo:results/omni_finetune/model_output_task_probes_20260616/action_object_relation/cosmos3_super_reasoner/metrics.json",
12525
  "exists": true,
12526
  "bytes": 21876,
12527
- "sha256": "a29f7e178b87c33f080cfa6dd275429e375d95c1d0a889f0436cee5f9d8a8974"
12528
  },
12529
  "mirrors": {
12530
  "hf_artifacts": {
12531
  "path": "hf_artifacts:results/omni_finetune/model_output_task_probes_20260616/action_object_relation/cosmos3_super_reasoner/metrics.json",
12532
  "exists": true,
12533
  "bytes": 21876,
12534
- "sha256": "a29f7e178b87c33f080cfa6dd275429e375d95c1d0a889f0436cee5f9d8a8974"
12535
  },
12536
  "hf_model": {
12537
  "path": "hf_model:results/omni_finetune/model_output_task_probes_20260616/action_object_relation/cosmos3_super_reasoner/metrics.json",
12538
  "exists": true,
12539
  "bytes": 21876,
12540
- "sha256": "a29f7e178b87c33f080cfa6dd275429e375d95c1d0a889f0436cee5f9d8a8974"
12541
  }
12542
  },
12543
  "failures": []
@@ -12599,20 +12599,20 @@
12599
  "path": "repo:results/omni_finetune/model_output_task_probes_20260616/action_object_relation/qwen3_omni_v6_lora/metrics.json",
12600
  "exists": true,
12601
  "bytes": 169938,
12602
- "sha256": "81ce31f176ce451fd3f99397c3c252356f7af49d4a29b404767640b7bb828c26"
12603
  },
12604
  "mirrors": {
12605
  "hf_artifacts": {
12606
  "path": "hf_artifacts:results/omni_finetune/model_output_task_probes_20260616/action_object_relation/qwen3_omni_v6_lora/metrics.json",
12607
  "exists": true,
12608
  "bytes": 169938,
12609
- "sha256": "81ce31f176ce451fd3f99397c3c252356f7af49d4a29b404767640b7bb828c26"
12610
  },
12611
  "hf_model": {
12612
  "path": "hf_model:results/omni_finetune/model_output_task_probes_20260616/action_object_relation/qwen3_omni_v6_lora/metrics.json",
12613
  "exists": true,
12614
  "bytes": 169938,
12615
- "sha256": "81ce31f176ce451fd3f99397c3c252356f7af49d4a29b404767640b7bb828c26"
12616
  }
12617
  },
12618
  "failures": []
@@ -12674,20 +12674,20 @@
12674
  "path": "repo:results/omni_finetune/model_output_task_probes_20260616/long_horizon_next_action/cosmos3_nano_future_window/metrics.json",
12675
  "exists": true,
12676
  "bytes": 7404,
12677
- "sha256": "2278e86f837c556f415ea9b4b331527c3297c5b443ffb0b65190338db57423b3"
12678
  },
12679
  "mirrors": {
12680
  "hf_artifacts": {
12681
  "path": "hf_artifacts:results/omni_finetune/model_output_task_probes_20260616/long_horizon_next_action/cosmos3_nano_future_window/metrics.json",
12682
  "exists": true,
12683
  "bytes": 7404,
12684
- "sha256": "2278e86f837c556f415ea9b4b331527c3297c5b443ffb0b65190338db57423b3"
12685
  },
12686
  "hf_model": {
12687
  "path": "hf_model:results/omni_finetune/model_output_task_probes_20260616/long_horizon_next_action/cosmos3_nano_future_window/metrics.json",
12688
  "exists": true,
12689
  "bytes": 7404,
12690
- "sha256": "2278e86f837c556f415ea9b4b331527c3297c5b443ffb0b65190338db57423b3"
12691
  }
12692
  },
12693
  "failures": []
@@ -12748,21 +12748,71 @@
12748
  "local": {
12749
  "path": "repo:results/omni_finetune/model_output_task_probes_20260616/summary.json",
12750
  "exists": true,
12751
- "bytes": 2830,
12752
- "sha256": "7313cc227e570e7a71e245f75c14da3df9c005e5f048fd82696d852b1bf2d2f3"
12753
  },
12754
  "mirrors": {
12755
  "hf_artifacts": {
12756
  "path": "hf_artifacts:results/omni_finetune/model_output_task_probes_20260616/summary.json",
12757
  "exists": true,
12758
- "bytes": 2830,
12759
- "sha256": "7313cc227e570e7a71e245f75c14da3df9c005e5f048fd82696d852b1bf2d2f3"
12760
  },
12761
  "hf_model": {
12762
  "path": "hf_model:results/omni_finetune/model_output_task_probes_20260616/summary.json",
12763
  "exists": true,
12764
- "bytes": 2830,
12765
- "sha256": "7313cc227e570e7a71e245f75c14da3df9c005e5f048fd82696d852b1bf2d2f3"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
12766
  }
12767
  },
12768
  "failures": []
@@ -20661,27 +20711,27 @@
20661
  "local": {
20662
  "path": "repo:TASK_METHOD_20_GAP_AUDIT.md",
20663
  "exists": true,
20664
- "bytes": 10094,
20665
- "sha256": "d4590c09e18344db280965ba7de38a2531fc3bc8d72fa8ee7cdfcd61928461dd"
20666
  },
20667
  "mirrors": {
20668
  "hf_space": {
20669
  "path": "hf_space:TASK_METHOD_20_GAP_AUDIT.md",
20670
  "exists": true,
20671
- "bytes": 10094,
20672
- "sha256": "d4590c09e18344db280965ba7de38a2531fc3bc8d72fa8ee7cdfcd61928461dd"
20673
  },
20674
  "hf_artifacts": {
20675
  "path": "hf_artifacts:TASK_METHOD_20_GAP_AUDIT.md",
20676
  "exists": true,
20677
- "bytes": 10094,
20678
- "sha256": "d4590c09e18344db280965ba7de38a2531fc3bc8d72fa8ee7cdfcd61928461dd"
20679
  },
20680
  "hf_model": {
20681
  "path": "hf_model:TASK_METHOD_20_GAP_AUDIT.md",
20682
  "exists": true,
20683
- "bytes": 10094,
20684
- "sha256": "d4590c09e18344db280965ba7de38a2531fc3bc8d72fa8ee7cdfcd61928461dd"
20685
  }
20686
  },
20687
  "failures": []
@@ -20692,27 +20742,27 @@
20692
  "local": {
20693
  "path": "repo:TASK_METHOD_20_RESULT_MATRIX.md",
20694
  "exists": true,
20695
- "bytes": 3946,
20696
- "sha256": "b166f6362dfed5ce4b0619f8c65853a1795ff9d65c47200825658ec725d7616d"
20697
  },
20698
  "mirrors": {
20699
  "hf_space": {
20700
  "path": "hf_space:TASK_METHOD_20_RESULT_MATRIX.md",
20701
  "exists": true,
20702
- "bytes": 3946,
20703
- "sha256": "b166f6362dfed5ce4b0619f8c65853a1795ff9d65c47200825658ec725d7616d"
20704
  },
20705
  "hf_artifacts": {
20706
  "path": "hf_artifacts:TASK_METHOD_20_RESULT_MATRIX.md",
20707
  "exists": true,
20708
- "bytes": 3946,
20709
- "sha256": "b166f6362dfed5ce4b0619f8c65853a1795ff9d65c47200825658ec725d7616d"
20710
  },
20711
  "hf_model": {
20712
  "path": "hf_model:TASK_METHOD_20_RESULT_MATRIX.md",
20713
  "exists": true,
20714
- "bytes": 3946,
20715
- "sha256": "b166f6362dfed5ce4b0619f8c65853a1795ff9d65c47200825658ec725d7616d"
20716
  }
20717
  },
20718
  "failures": []
 
1
  {
2
  "status": "pass",
3
+ "generated_at_utc": "2026-06-18T15:39:07+00:00",
4
  "hf_root": "hf_publish",
5
  "summary": {
6
+ "group_count": 758,
7
  "failure_count": 0,
8
  "failures_by_surface": {}
9
  },
 
138
  "local": {
139
  "path": "repo:docs/data/artifact_index.json",
140
  "exists": true,
141
+ "bytes": 116109,
142
+ "sha256": "3bdc53d5d238108e58c345cd7f572f3f55d388ce1387319538242326946e8f4a"
143
  },
144
  "mirrors": {
145
  "hf_space": {
146
  "path": "hf_space:data/artifact_index.json",
147
  "exists": true,
148
+ "bytes": 116109,
149
+ "sha256": "3bdc53d5d238108e58c345cd7f572f3f55d388ce1387319538242326946e8f4a"
150
  },
151
  "hf_artifacts_data": {
152
  "path": "hf_artifacts:data/artifact_index.json",
153
  "exists": true,
154
+ "bytes": 116109,
155
+ "sha256": "3bdc53d5d238108e58c345cd7f572f3f55d388ce1387319538242326946e8f4a"
156
  },
157
  "hf_artifacts": {
158
  "path": "hf_artifacts:docs/data/artifact_index.json",
159
  "exists": true,
160
+ "bytes": 116109,
161
+ "sha256": "3bdc53d5d238108e58c345cd7f572f3f55d388ce1387319538242326946e8f4a"
162
  },
163
  "hf_model_data": {
164
  "path": "hf_model:data/artifact_index.json",
165
  "exists": true,
166
+ "bytes": 116109,
167
+ "sha256": "3bdc53d5d238108e58c345cd7f572f3f55d388ce1387319538242326946e8f4a"
168
  },
169
  "hf_model_docs_data": {
170
  "path": "hf_model:docs/data/artifact_index.json",
171
  "exists": true,
172
+ "bytes": 116109,
173
+ "sha256": "3bdc53d5d238108e58c345cd7f572f3f55d388ce1387319538242326946e8f4a"
174
  },
175
  "hf_model": {
176
  "path": "hf_model:metrics/artifact_index.json",
177
  "exists": true,
178
+ "bytes": 116109,
179
+ "sha256": "3bdc53d5d238108e58c345cd7f572f3f55d388ce1387319538242326946e8f4a"
180
  }
181
  },
182
  "failures": []
 
923
  "path": "repo:docs/data/publication_audit.json",
924
  "exists": true,
925
  "bytes": 9520,
926
+ "sha256": "b454dbac39adce1d31c6918ab8ff28e4688363c12a4e3816ccb54c3a8a1170f8"
927
  },
928
  "mirrors": {
929
  "hf_space": {
930
  "path": "hf_space:data/publication_audit.json",
931
  "exists": true,
932
  "bytes": 9520,
933
+ "sha256": "b454dbac39adce1d31c6918ab8ff28e4688363c12a4e3816ccb54c3a8a1170f8"
934
  },
935
  "hf_artifacts_data": {
936
  "path": "hf_artifacts:data/publication_audit.json",
937
  "exists": true,
938
  "bytes": 9520,
939
+ "sha256": "b454dbac39adce1d31c6918ab8ff28e4688363c12a4e3816ccb54c3a8a1170f8"
940
  },
941
  "hf_artifacts": {
942
  "path": "hf_artifacts:docs/data/publication_audit.json",
943
  "exists": true,
944
  "bytes": 9520,
945
+ "sha256": "b454dbac39adce1d31c6918ab8ff28e4688363c12a4e3816ccb54c3a8a1170f8"
946
  },
947
  "hf_model_data": {
948
  "path": "hf_model:data/publication_audit.json",
949
  "exists": true,
950
  "bytes": 9520,
951
+ "sha256": "b454dbac39adce1d31c6918ab8ff28e4688363c12a4e3816ccb54c3a8a1170f8"
952
  },
953
  "hf_model_docs_data": {
954
  "path": "hf_model:docs/data/publication_audit.json",
955
  "exists": true,
956
  "bytes": 9520,
957
+ "sha256": "b454dbac39adce1d31c6918ab8ff28e4688363c12a4e3816ccb54c3a8a1170f8"
958
  },
959
  "hf_model": {
960
  "path": "hf_model:metrics/publication_audit.json",
961
  "exists": true,
962
  "bytes": 9520,
963
+ "sha256": "b454dbac39adce1d31c6918ab8ff28e4688363c12a4e3816ccb54c3a8a1170f8"
964
  }
965
  },
966
  "failures": []
 
972
  "path": "repo:docs/data/public_surface_qa.json",
973
  "exists": true,
974
  "bytes": 7126,
975
+ "sha256": "f911c70b8a08a8b3f6738278d2927c3612f238be7b27c1c724a4abb00031ba35"
976
  },
977
  "mirrors": {
978
  "hf_space": {
979
  "path": "hf_space:data/public_surface_qa.json",
980
  "exists": true,
981
  "bytes": 7126,
982
+ "sha256": "f911c70b8a08a8b3f6738278d2927c3612f238be7b27c1c724a4abb00031ba35"
983
  },
984
  "hf_artifacts_data": {
985
  "path": "hf_artifacts:data/public_surface_qa.json",
986
  "exists": true,
987
  "bytes": 7126,
988
+ "sha256": "f911c70b8a08a8b3f6738278d2927c3612f238be7b27c1c724a4abb00031ba35"
989
  },
990
  "hf_artifacts": {
991
  "path": "hf_artifacts:docs/data/public_surface_qa.json",
992
  "exists": true,
993
  "bytes": 7126,
994
+ "sha256": "f911c70b8a08a8b3f6738278d2927c3612f238be7b27c1c724a4abb00031ba35"
995
  },
996
  "hf_model_data": {
997
  "path": "hf_model:data/public_surface_qa.json",
998
  "exists": true,
999
  "bytes": 7126,
1000
+ "sha256": "f911c70b8a08a8b3f6738278d2927c3612f238be7b27c1c724a4abb00031ba35"
1001
  },
1002
  "hf_model_docs_data": {
1003
  "path": "hf_model:docs/data/public_surface_qa.json",
1004
  "exists": true,
1005
  "bytes": 7126,
1006
+ "sha256": "f911c70b8a08a8b3f6738278d2927c3612f238be7b27c1c724a4abb00031ba35"
1007
  },
1008
  "hf_model": {
1009
  "path": "hf_model:metrics/public_surface_qa.json",
1010
  "exists": true,
1011
  "bytes": 7126,
1012
+ "sha256": "f911c70b8a08a8b3f6738278d2927c3612f238be7b27c1c724a4abb00031ba35"
1013
  }
1014
  },
1015
  "failures": []
 
1119
  "path": "repo:docs/data/quality_gates.json",
1120
  "exists": true,
1121
  "bytes": 8100,
1122
+ "sha256": "60250841056be6be5856bbe903fa561ec1cc3b7d37566b8d321da555a70aa343"
1123
  },
1124
  "mirrors": {
1125
  "hf_space": {
1126
  "path": "hf_space:data/quality_gates.json",
1127
  "exists": true,
1128
  "bytes": 8100,
1129
+ "sha256": "60250841056be6be5856bbe903fa561ec1cc3b7d37566b8d321da555a70aa343"
1130
  },
1131
  "hf_artifacts_data": {
1132
  "path": "hf_artifacts:data/quality_gates.json",
1133
  "exists": true,
1134
  "bytes": 8100,
1135
+ "sha256": "60250841056be6be5856bbe903fa561ec1cc3b7d37566b8d321da555a70aa343"
1136
  },
1137
  "hf_artifacts": {
1138
  "path": "hf_artifacts:docs/data/quality_gates.json",
1139
  "exists": true,
1140
  "bytes": 8100,
1141
+ "sha256": "60250841056be6be5856bbe903fa561ec1cc3b7d37566b8d321da555a70aa343"
1142
  },
1143
  "hf_model_data": {
1144
  "path": "hf_model:data/quality_gates.json",
1145
  "exists": true,
1146
  "bytes": 8100,
1147
+ "sha256": "60250841056be6be5856bbe903fa561ec1cc3b7d37566b8d321da555a70aa343"
1148
  },
1149
  "hf_model_docs_data": {
1150
  "path": "hf_model:docs/data/quality_gates.json",
1151
  "exists": true,
1152
  "bytes": 8100,
1153
+ "sha256": "60250841056be6be5856bbe903fa561ec1cc3b7d37566b8d321da555a70aa343"
1154
  },
1155
  "hf_model": {
1156
  "path": "hf_model:metrics/quality_gates.json",
1157
  "exists": true,
1158
  "bytes": 8100,
1159
+ "sha256": "60250841056be6be5856bbe903fa561ec1cc3b7d37566b8d321da555a70aa343"
1160
  }
1161
  },
1162
  "failures": []
 
1658
  "path": "repo:docs/data/source_alignment_audit.json",
1659
  "exists": true,
1660
  "bytes": 4432,
1661
+ "sha256": "e3437d446af0c3073f7f78034280032cd2c4c83114c50a2903e676790886fd37"
1662
  },
1663
  "mirrors": {
1664
  "hf_space": {
1665
  "path": "hf_space:data/source_alignment_audit.json",
1666
  "exists": true,
1667
  "bytes": 4432,
1668
+ "sha256": "e3437d446af0c3073f7f78034280032cd2c4c83114c50a2903e676790886fd37"
1669
  },
1670
  "hf_artifacts_data": {
1671
  "path": "hf_artifacts:data/source_alignment_audit.json",
1672
  "exists": true,
1673
  "bytes": 4432,
1674
+ "sha256": "e3437d446af0c3073f7f78034280032cd2c4c83114c50a2903e676790886fd37"
1675
  },
1676
  "hf_artifacts": {
1677
  "path": "hf_artifacts:docs/data/source_alignment_audit.json",
1678
  "exists": true,
1679
  "bytes": 4432,
1680
+ "sha256": "e3437d446af0c3073f7f78034280032cd2c4c83114c50a2903e676790886fd37"
1681
  },
1682
  "hf_model_data": {
1683
  "path": "hf_model:data/source_alignment_audit.json",
1684
  "exists": true,
1685
  "bytes": 4432,
1686
+ "sha256": "e3437d446af0c3073f7f78034280032cd2c4c83114c50a2903e676790886fd37"
1687
  },
1688
  "hf_model_docs_data": {
1689
  "path": "hf_model:docs/data/source_alignment_audit.json",
1690
  "exists": true,
1691
  "bytes": 4432,
1692
+ "sha256": "e3437d446af0c3073f7f78034280032cd2c4c83114c50a2903e676790886fd37"
1693
  },
1694
  "hf_model": {
1695
  "path": "hf_model:metrics/source_alignment_audit.json",
1696
  "exists": true,
1697
  "bytes": 4432,
1698
+ "sha256": "e3437d446af0c3073f7f78034280032cd2c4c83114c50a2903e676790886fd37"
1699
  }
1700
  },
1701
  "failures": []
 
1756
  "path": "repo:docs/data/single_episode_task_model_radar.json",
1757
  "exists": true,
1758
  "bytes": 51064,
1759
+ "sha256": "ca48852ee62c58d83ff9fed7f775a3babb07653aab00a2b4266ea9885cbc45ff"
1760
  },
1761
  "mirrors": {
1762
  "hf_space": {
1763
  "path": "hf_space:data/single_episode_task_model_radar.json",
1764
  "exists": true,
1765
  "bytes": 51064,
1766
+ "sha256": "ca48852ee62c58d83ff9fed7f775a3babb07653aab00a2b4266ea9885cbc45ff"
1767
  },
1768
  "hf_artifacts_data": {
1769
  "path": "hf_artifacts:data/single_episode_task_model_radar.json",
1770
  "exists": true,
1771
  "bytes": 51064,
1772
+ "sha256": "ca48852ee62c58d83ff9fed7f775a3babb07653aab00a2b4266ea9885cbc45ff"
1773
  },
1774
  "hf_artifacts": {
1775
  "path": "hf_artifacts:docs/data/single_episode_task_model_radar.json",
1776
  "exists": true,
1777
  "bytes": 51064,
1778
+ "sha256": "ca48852ee62c58d83ff9fed7f775a3babb07653aab00a2b4266ea9885cbc45ff"
1779
  },
1780
  "hf_model_data": {
1781
  "path": "hf_model:data/single_episode_task_model_radar.json",
1782
  "exists": true,
1783
  "bytes": 51064,
1784
+ "sha256": "ca48852ee62c58d83ff9fed7f775a3babb07653aab00a2b4266ea9885cbc45ff"
1785
  },
1786
  "hf_model_docs_data": {
1787
  "path": "hf_model:docs/data/single_episode_task_model_radar.json",
1788
  "exists": true,
1789
  "bytes": 51064,
1790
+ "sha256": "ca48852ee62c58d83ff9fed7f775a3babb07653aab00a2b4266ea9885cbc45ff"
1791
  },
1792
  "hf_model": {
1793
  "path": "hf_model:metrics/single_episode_task_model_radar.json",
1794
  "exists": true,
1795
  "bytes": 51064,
1796
+ "sha256": "ca48852ee62c58d83ff9fed7f775a3babb07653aab00a2b4266ea9885cbc45ff"
1797
  }
1798
  },
1799
  "failures": []
 
1804
  "local": {
1805
  "path": "repo:docs/data/episode128_task_model_radar.json",
1806
  "exists": true,
1807
+ "bytes": 185480,
1808
+ "sha256": "52250951319a87a069bfca26338a1daa1511a2bd4bb145801e5e44d230dcac1c"
1809
  },
1810
  "mirrors": {
1811
  "hf_space": {
1812
  "path": "hf_space:data/episode128_task_model_radar.json",
1813
  "exists": true,
1814
+ "bytes": 185480,
1815
+ "sha256": "52250951319a87a069bfca26338a1daa1511a2bd4bb145801e5e44d230dcac1c"
1816
  },
1817
  "hf_artifacts_data": {
1818
  "path": "hf_artifacts:data/episode128_task_model_radar.json",
1819
  "exists": true,
1820
+ "bytes": 185480,
1821
+ "sha256": "52250951319a87a069bfca26338a1daa1511a2bd4bb145801e5e44d230dcac1c"
1822
  },
1823
  "hf_artifacts": {
1824
  "path": "hf_artifacts:docs/data/episode128_task_model_radar.json",
1825
  "exists": true,
1826
+ "bytes": 185480,
1827
+ "sha256": "52250951319a87a069bfca26338a1daa1511a2bd4bb145801e5e44d230dcac1c"
1828
  },
1829
  "hf_model_data": {
1830
  "path": "hf_model:data/episode128_task_model_radar.json",
1831
  "exists": true,
1832
+ "bytes": 185480,
1833
+ "sha256": "52250951319a87a069bfca26338a1daa1511a2bd4bb145801e5e44d230dcac1c"
1834
  },
1835
  "hf_model_docs_data": {
1836
  "path": "hf_model:docs/data/episode128_task_model_radar.json",
1837
  "exists": true,
1838
+ "bytes": 185480,
1839
+ "sha256": "52250951319a87a069bfca26338a1daa1511a2bd4bb145801e5e44d230dcac1c"
1840
  },
1841
  "hf_model": {
1842
  "path": "hf_model:metrics/episode128_task_model_radar.json",
1843
  "exists": true,
1844
+ "bytes": 185480,
1845
+ "sha256": "52250951319a87a069bfca26338a1daa1511a2bd4bb145801e5e44d230dcac1c"
1846
  }
1847
  },
1848
  "failures": []
 
2001
  "path": "repo:docs/data/task_surface_integrity.json",
2002
  "exists": true,
2003
  "bytes": 45779,
2004
+ "sha256": "31e3e8540450943c01c1d3523d7c61f13e1d481b41190dd4de8c67431ca3c597"
2005
  },
2006
  "mirrors": {
2007
  "hf_space": {
2008
  "path": "hf_space:data/task_surface_integrity.json",
2009
  "exists": true,
2010
  "bytes": 45779,
2011
+ "sha256": "31e3e8540450943c01c1d3523d7c61f13e1d481b41190dd4de8c67431ca3c597"
2012
  },
2013
  "hf_artifacts_data": {
2014
  "path": "hf_artifacts:data/task_surface_integrity.json",
2015
  "exists": true,
2016
  "bytes": 45779,
2017
+ "sha256": "31e3e8540450943c01c1d3523d7c61f13e1d481b41190dd4de8c67431ca3c597"
2018
  },
2019
  "hf_artifacts": {
2020
  "path": "hf_artifacts:docs/data/task_surface_integrity.json",
2021
  "exists": true,
2022
  "bytes": 45779,
2023
+ "sha256": "31e3e8540450943c01c1d3523d7c61f13e1d481b41190dd4de8c67431ca3c597"
2024
  },
2025
  "hf_model_data": {
2026
  "path": "hf_model:data/task_surface_integrity.json",
2027
  "exists": true,
2028
  "bytes": 45779,
2029
+ "sha256": "31e3e8540450943c01c1d3523d7c61f13e1d481b41190dd4de8c67431ca3c597"
2030
  },
2031
  "hf_model_docs_data": {
2032
  "path": "hf_model:docs/data/task_surface_integrity.json",
2033
  "exists": true,
2034
  "bytes": 45779,
2035
+ "sha256": "31e3e8540450943c01c1d3523d7c61f13e1d481b41190dd4de8c67431ca3c597"
2036
  },
2037
  "hf_model": {
2038
  "path": "hf_model:metrics/task_surface_integrity.json",
2039
  "exists": true,
2040
  "bytes": 45779,
2041
+ "sha256": "31e3e8540450943c01c1d3523d7c61f13e1d481b41190dd4de8c67431ca3c597"
2042
  }
2043
  },
2044
  "failures": []
 
2098
  "local": {
2099
  "path": "repo:docs/data/task_method_20_result_matrix.json",
2100
  "exists": true,
2101
+ "bytes": 128862,
2102
+ "sha256": "7d071dd9d840025d566d430f7c24f7005f8c8d4acb73d14fbbd5df754e996f70"
2103
  },
2104
  "mirrors": {
2105
  "hf_space": {
2106
  "path": "hf_space:data/task_method_20_result_matrix.json",
2107
  "exists": true,
2108
+ "bytes": 128862,
2109
+ "sha256": "7d071dd9d840025d566d430f7c24f7005f8c8d4acb73d14fbbd5df754e996f70"
2110
  },
2111
  "hf_artifacts_data": {
2112
  "path": "hf_artifacts:data/task_method_20_result_matrix.json",
2113
  "exists": true,
2114
+ "bytes": 128862,
2115
+ "sha256": "7d071dd9d840025d566d430f7c24f7005f8c8d4acb73d14fbbd5df754e996f70"
2116
  },
2117
  "hf_artifacts": {
2118
  "path": "hf_artifacts:docs/data/task_method_20_result_matrix.json",
2119
  "exists": true,
2120
+ "bytes": 128862,
2121
+ "sha256": "7d071dd9d840025d566d430f7c24f7005f8c8d4acb73d14fbbd5df754e996f70"
2122
  },
2123
  "hf_model_data": {
2124
  "path": "hf_model:data/task_method_20_result_matrix.json",
2125
  "exists": true,
2126
+ "bytes": 128862,
2127
+ "sha256": "7d071dd9d840025d566d430f7c24f7005f8c8d4acb73d14fbbd5df754e996f70"
2128
  },
2129
  "hf_model_docs_data": {
2130
  "path": "hf_model:docs/data/task_method_20_result_matrix.json",
2131
  "exists": true,
2132
+ "bytes": 128862,
2133
+ "sha256": "7d071dd9d840025d566d430f7c24f7005f8c8d4acb73d14fbbd5df754e996f70"
2134
  },
2135
  "hf_model": {
2136
  "path": "hf_model:metrics/task_method_20_result_matrix.json",
2137
  "exists": true,
2138
+ "bytes": 128862,
2139
+ "sha256": "7d071dd9d840025d566d430f7c24f7005f8c8d4acb73d14fbbd5df754e996f70"
2140
  }
2141
  },
2142
  "failures": []
 
2147
  "local": {
2148
  "path": "repo:docs/data/task_method_20_gap_audit.json",
2149
  "exists": true,
2150
+ "bytes": 34384,
2151
+ "sha256": "ec64d78e07d4951f14832945668b1c2252a61393672e3d607478e7d6f95ccf99"
2152
  },
2153
  "mirrors": {
2154
  "hf_space": {
2155
  "path": "hf_space:data/task_method_20_gap_audit.json",
2156
  "exists": true,
2157
+ "bytes": 34384,
2158
+ "sha256": "ec64d78e07d4951f14832945668b1c2252a61393672e3d607478e7d6f95ccf99"
2159
  },
2160
  "hf_artifacts_data": {
2161
  "path": "hf_artifacts:data/task_method_20_gap_audit.json",
2162
  "exists": true,
2163
+ "bytes": 34384,
2164
+ "sha256": "ec64d78e07d4951f14832945668b1c2252a61393672e3d607478e7d6f95ccf99"
2165
  },
2166
  "hf_artifacts": {
2167
  "path": "hf_artifacts:docs/data/task_method_20_gap_audit.json",
2168
  "exists": true,
2169
+ "bytes": 34384,
2170
+ "sha256": "ec64d78e07d4951f14832945668b1c2252a61393672e3d607478e7d6f95ccf99"
2171
  },
2172
  "hf_model_data": {
2173
  "path": "hf_model:data/task_method_20_gap_audit.json",
2174
  "exists": true,
2175
+ "bytes": 34384,
2176
+ "sha256": "ec64d78e07d4951f14832945668b1c2252a61393672e3d607478e7d6f95ccf99"
2177
  },
2178
  "hf_model_docs_data": {
2179
  "path": "hf_model:docs/data/task_method_20_gap_audit.json",
2180
  "exists": true,
2181
+ "bytes": 34384,
2182
+ "sha256": "ec64d78e07d4951f14832945668b1c2252a61393672e3d607478e7d6f95ccf99"
2183
  },
2184
  "hf_model": {
2185
  "path": "hf_model:metrics/task_method_20_gap_audit.json",
2186
  "exists": true,
2187
+ "bytes": 34384,
2188
+ "sha256": "ec64d78e07d4951f14832945668b1c2252a61393672e3d607478e7d6f95ccf99"
2189
  }
2190
  },
2191
  "failures": []
 
2245
  "local": {
2246
  "path": "repo:docs/data/unified_task_model_radar.json",
2247
  "exists": true,
2248
+ "bytes": 229332,
2249
+ "sha256": "34bccb1afa3dc987a98e774c55b00e23d4345d69b3dca3fd124ef64bde0c3d34"
2250
  },
2251
  "mirrors": {
2252
  "hf_space": {
2253
  "path": "hf_space:data/unified_task_model_radar.json",
2254
  "exists": true,
2255
+ "bytes": 229332,
2256
+ "sha256": "34bccb1afa3dc987a98e774c55b00e23d4345d69b3dca3fd124ef64bde0c3d34"
2257
  },
2258
  "hf_artifacts_data": {
2259
  "path": "hf_artifacts:data/unified_task_model_radar.json",
2260
  "exists": true,
2261
+ "bytes": 229332,
2262
+ "sha256": "34bccb1afa3dc987a98e774c55b00e23d4345d69b3dca3fd124ef64bde0c3d34"
2263
  },
2264
  "hf_artifacts": {
2265
  "path": "hf_artifacts:docs/data/unified_task_model_radar.json",
2266
  "exists": true,
2267
+ "bytes": 229332,
2268
+ "sha256": "34bccb1afa3dc987a98e774c55b00e23d4345d69b3dca3fd124ef64bde0c3d34"
2269
  },
2270
  "hf_model_data": {
2271
  "path": "hf_model:data/unified_task_model_radar.json",
2272
  "exists": true,
2273
+ "bytes": 229332,
2274
+ "sha256": "34bccb1afa3dc987a98e774c55b00e23d4345d69b3dca3fd124ef64bde0c3d34"
2275
  },
2276
  "hf_model_docs_data": {
2277
  "path": "hf_model:docs/data/unified_task_model_radar.json",
2278
  "exists": true,
2279
+ "bytes": 229332,
2280
+ "sha256": "34bccb1afa3dc987a98e774c55b00e23d4345d69b3dca3fd124ef64bde0c3d34"
2281
  },
2282
  "hf_model": {
2283
  "path": "hf_model:metrics/unified_task_model_radar.json",
2284
  "exists": true,
2285
+ "bytes": 229332,
2286
+ "sha256": "34bccb1afa3dc987a98e774c55b00e23d4345d69b3dca3fd124ef64bde0c3d34"
2287
  }
2288
  },
2289
  "failures": []
 
2294
  "local": {
2295
  "path": "repo:docs/data/website_integrity.json",
2296
  "exists": true,
2297
+ "bytes": 20021,
2298
+ "sha256": "3ad229c374e2c3dd05e96e3f4d45c9e8273fdabeffa395dc2c521e9e5392e25e"
2299
  },
2300
  "mirrors": {
2301
  "hf_space": {
2302
  "path": "hf_space:data/website_integrity.json",
2303
  "exists": true,
2304
+ "bytes": 20021,
2305
+ "sha256": "3ad229c374e2c3dd05e96e3f4d45c9e8273fdabeffa395dc2c521e9e5392e25e"
2306
  },
2307
  "hf_artifacts_data": {
2308
  "path": "hf_artifacts:data/website_integrity.json",
2309
  "exists": true,
2310
+ "bytes": 20021,
2311
+ "sha256": "3ad229c374e2c3dd05e96e3f4d45c9e8273fdabeffa395dc2c521e9e5392e25e"
2312
  },
2313
  "hf_artifacts": {
2314
  "path": "hf_artifacts:docs/data/website_integrity.json",
2315
  "exists": true,
2316
+ "bytes": 20021,
2317
+ "sha256": "3ad229c374e2c3dd05e96e3f4d45c9e8273fdabeffa395dc2c521e9e5392e25e"
2318
  },
2319
  "hf_model_data": {
2320
  "path": "hf_model:data/website_integrity.json",
2321
  "exists": true,
2322
+ "bytes": 20021,
2323
+ "sha256": "3ad229c374e2c3dd05e96e3f4d45c9e8273fdabeffa395dc2c521e9e5392e25e"
2324
  },
2325
  "hf_model_docs_data": {
2326
  "path": "hf_model:docs/data/website_integrity.json",
2327
  "exists": true,
2328
+ "bytes": 20021,
2329
+ "sha256": "3ad229c374e2c3dd05e96e3f4d45c9e8273fdabeffa395dc2c521e9e5392e25e"
2330
  },
2331
  "hf_model": {
2332
  "path": "hf_model:metrics/website_integrity.json",
2333
  "exists": true,
2334
+ "bytes": 20021,
2335
+ "sha256": "3ad229c374e2c3dd05e96e3f4d45c9e8273fdabeffa395dc2c521e9e5392e25e"
2336
  }
2337
  },
2338
  "failures": []
 
2515
  "local": {
2516
  "path": "repo:docs/assets/charts/episode128_task_model_radar.svg",
2517
  "exists": true,
2518
+ "bytes": 48019,
2519
+ "sha256": "70fb20c3f8f9574303b5e4832fba7b5e39ae20b75aa006af53ac1457b7daf64e"
2520
  },
2521
  "mirrors": {
2522
  "hf_space": {
2523
  "path": "hf_space:assets/charts/episode128_task_model_radar.svg",
2524
  "exists": true,
2525
+ "bytes": 48019,
2526
+ "sha256": "70fb20c3f8f9574303b5e4832fba7b5e39ae20b75aa006af53ac1457b7daf64e"
2527
  },
2528
  "hf_artifacts_docs": {
2529
  "path": "hf_artifacts:docs/assets/charts/episode128_task_model_radar.svg",
2530
  "exists": true,
2531
+ "bytes": 48019,
2532
+ "sha256": "70fb20c3f8f9574303b5e4832fba7b5e39ae20b75aa006af53ac1457b7daf64e"
2533
  },
2534
  "hf_artifacts_card": {
2535
  "path": "hf_artifacts:assets/charts/episode128_task_model_radar.svg",
2536
  "exists": true,
2537
+ "bytes": 48019,
2538
+ "sha256": "70fb20c3f8f9574303b5e4832fba7b5e39ae20b75aa006af53ac1457b7daf64e"
2539
  },
2540
  "hf_model": {
2541
  "path": "hf_model:assets/charts/episode128_task_model_radar.svg",
2542
  "exists": true,
2543
+ "bytes": 48019,
2544
+ "sha256": "70fb20c3f8f9574303b5e4832fba7b5e39ae20b75aa006af53ac1457b7daf64e"
2545
  }
2546
  },
2547
  "failures": []
 
2589
  "local": {
2590
  "path": "repo:docs/assets/charts/unified_task_model_radar.svg",
2591
  "exists": true,
2592
+ "bytes": 54032,
2593
+ "sha256": "56893b66dfb07f3028844fe96846614715058b808c731ce870232ad6247a3a50"
2594
  },
2595
  "mirrors": {
2596
  "hf_space": {
2597
  "path": "hf_space:assets/charts/unified_task_model_radar.svg",
2598
  "exists": true,
2599
+ "bytes": 54032,
2600
+ "sha256": "56893b66dfb07f3028844fe96846614715058b808c731ce870232ad6247a3a50"
2601
  },
2602
  "hf_artifacts_docs": {
2603
  "path": "hf_artifacts:docs/assets/charts/unified_task_model_radar.svg",
2604
  "exists": true,
2605
+ "bytes": 54032,
2606
+ "sha256": "56893b66dfb07f3028844fe96846614715058b808c731ce870232ad6247a3a50"
2607
  },
2608
  "hf_artifacts_card": {
2609
  "path": "hf_artifacts:assets/charts/unified_task_model_radar.svg",
2610
  "exists": true,
2611
+ "bytes": 54032,
2612
+ "sha256": "56893b66dfb07f3028844fe96846614715058b808c731ce870232ad6247a3a50"
2613
  },
2614
  "hf_model": {
2615
  "path": "hf_model:assets/charts/unified_task_model_radar.svg",
2616
  "exists": true,
2617
+ "bytes": 54032,
2618
+ "sha256": "56893b66dfb07f3028844fe96846614715058b808c731ce870232ad6247a3a50"
2619
  }
2620
  },
2621
  "failures": []
 
4472
  "local": {
4473
  "path": "repo:scripts/omni/score_existing_model_output_task_probes.py",
4474
  "exists": true,
4475
+ "bytes": 27917,
4476
+ "sha256": "421c50262c38dd222ab0c5f50d78f4d92ee18f13b9a96661b292c44c05e89b1d"
4477
  },
4478
  "mirrors": {
4479
  "hf_artifacts": {
4480
  "path": "hf_artifacts:scripts/omni/score_existing_model_output_task_probes.py",
4481
  "exists": true,
4482
+ "bytes": 27917,
4483
+ "sha256": "421c50262c38dd222ab0c5f50d78f4d92ee18f13b9a96661b292c44c05e89b1d"
4484
  },
4485
  "hf_model": {
4486
  "path": "hf_model:scripts/omni/score_existing_model_output_task_probes.py",
4487
  "exists": true,
4488
+ "bytes": 27917,
4489
+ "sha256": "421c50262c38dd222ab0c5f50d78f4d92ee18f13b9a96661b292c44c05e89b1d"
4490
  }
4491
  },
4492
  "failures": []
 
4997
  "local": {
4998
  "path": "repo:scripts/build_unified_task_model_radar.py",
4999
  "exists": true,
5000
+ "bytes": 53705,
5001
+ "sha256": "e35607dd679ce7c199868660cd733e1e67c6877e2c5f207de15e9738483af0dc"
5002
  },
5003
  "mirrors": {
5004
  "hf_artifacts": {
5005
  "path": "hf_artifacts:scripts/build_unified_task_model_radar.py",
5006
  "exists": true,
5007
+ "bytes": 53705,
5008
+ "sha256": "e35607dd679ce7c199868660cd733e1e67c6877e2c5f207de15e9738483af0dc"
5009
  },
5010
  "hf_model": {
5011
  "path": "hf_model:scripts/build_unified_task_model_radar.py",
5012
  "exists": true,
5013
+ "bytes": 53705,
5014
+ "sha256": "e35607dd679ce7c199868660cd733e1e67c6877e2c5f207de15e9738483af0dc"
5015
  }
5016
  },
5017
  "failures": []
 
5427
  "path": "repo:docs/index.html",
5428
  "exists": true,
5429
  "bytes": 254705,
5430
+ "sha256": "72b7cad1b07bc55446bc352a9e653dd1c600ee43ce00e8e284f8d3be3c9aa9d0"
5431
  },
5432
  "mirrors": {
5433
  "hf_space": {
5434
  "path": "hf_space:index.html",
5435
  "exists": true,
5436
  "bytes": 254705,
5437
+ "sha256": "72b7cad1b07bc55446bc352a9e653dd1c600ee43ce00e8e284f8d3be3c9aa9d0"
5438
  },
5439
  "hf_artifacts_root": {
5440
  "path": "hf_artifacts:index.html",
5441
  "exists": true,
5442
  "bytes": 254705,
5443
+ "sha256": "72b7cad1b07bc55446bc352a9e653dd1c600ee43ce00e8e284f8d3be3c9aa9d0"
5444
  },
5445
  "hf_artifacts_docs": {
5446
  "path": "hf_artifacts:docs/index.html",
5447
  "exists": true,
5448
  "bytes": 254705,
5449
+ "sha256": "72b7cad1b07bc55446bc352a9e653dd1c600ee43ce00e8e284f8d3be3c9aa9d0"
5450
  },
5451
  "hf_model": {
5452
  "path": "hf_model:index.html",
5453
  "exists": true,
5454
  "bytes": 254705,
5455
+ "sha256": "72b7cad1b07bc55446bc352a9e653dd1c600ee43ce00e8e284f8d3be3c9aa9d0"
5456
  },
5457
  "hf_model_docs": {
5458
  "path": "hf_model:docs/index.html",
5459
  "exists": true,
5460
  "bytes": 254705,
5461
+ "sha256": "72b7cad1b07bc55446bc352a9e653dd1c600ee43ce00e8e284f8d3be3c9aa9d0"
5462
  }
5463
  },
5464
  "failures": []
 
12498
  "local": {
12499
  "path": "repo:results/omni_finetune/model_output_task_probes_20260616/RUN_REPORT.md",
12500
  "exists": true,
12501
+ "bytes": 1200,
12502
+ "sha256": "f4a99f703b635c3847ac38ee1041431a5ba077342ee7ec8d0685af665b60c1bd"
12503
  },
12504
  "mirrors": {
12505
  "hf_artifacts": {
12506
  "path": "hf_artifacts:results/omni_finetune/model_output_task_probes_20260616/RUN_REPORT.md",
12507
  "exists": true,
12508
+ "bytes": 1200,
12509
+ "sha256": "f4a99f703b635c3847ac38ee1041431a5ba077342ee7ec8d0685af665b60c1bd"
12510
  },
12511
  "hf_model": {
12512
  "path": "hf_model:results/omni_finetune/model_output_task_probes_20260616/RUN_REPORT.md",
12513
  "exists": true,
12514
+ "bytes": 1200,
12515
+ "sha256": "f4a99f703b635c3847ac38ee1041431a5ba077342ee7ec8d0685af665b60c1bd"
12516
  }
12517
  },
12518
  "failures": []
 
12524
  "path": "repo:results/omni_finetune/model_output_task_probes_20260616/action_object_relation/cosmos3_super_reasoner/metrics.json",
12525
  "exists": true,
12526
  "bytes": 21876,
12527
+ "sha256": "82b725f285c833bda60c243430df610118a92f7fe04b5fc84bae88b90554133d"
12528
  },
12529
  "mirrors": {
12530
  "hf_artifacts": {
12531
  "path": "hf_artifacts:results/omni_finetune/model_output_task_probes_20260616/action_object_relation/cosmos3_super_reasoner/metrics.json",
12532
  "exists": true,
12533
  "bytes": 21876,
12534
+ "sha256": "82b725f285c833bda60c243430df610118a92f7fe04b5fc84bae88b90554133d"
12535
  },
12536
  "hf_model": {
12537
  "path": "hf_model:results/omni_finetune/model_output_task_probes_20260616/action_object_relation/cosmos3_super_reasoner/metrics.json",
12538
  "exists": true,
12539
  "bytes": 21876,
12540
+ "sha256": "82b725f285c833bda60c243430df610118a92f7fe04b5fc84bae88b90554133d"
12541
  }
12542
  },
12543
  "failures": []
 
12599
  "path": "repo:results/omni_finetune/model_output_task_probes_20260616/action_object_relation/qwen3_omni_v6_lora/metrics.json",
12600
  "exists": true,
12601
  "bytes": 169938,
12602
+ "sha256": "15ecae97fdd45b313ebe561705bafa9b57c6ff844404245fc74096ac2eccec69"
12603
  },
12604
  "mirrors": {
12605
  "hf_artifacts": {
12606
  "path": "hf_artifacts:results/omni_finetune/model_output_task_probes_20260616/action_object_relation/qwen3_omni_v6_lora/metrics.json",
12607
  "exists": true,
12608
  "bytes": 169938,
12609
+ "sha256": "15ecae97fdd45b313ebe561705bafa9b57c6ff844404245fc74096ac2eccec69"
12610
  },
12611
  "hf_model": {
12612
  "path": "hf_model:results/omni_finetune/model_output_task_probes_20260616/action_object_relation/qwen3_omni_v6_lora/metrics.json",
12613
  "exists": true,
12614
  "bytes": 169938,
12615
+ "sha256": "15ecae97fdd45b313ebe561705bafa9b57c6ff844404245fc74096ac2eccec69"
12616
  }
12617
  },
12618
  "failures": []
 
12674
  "path": "repo:results/omni_finetune/model_output_task_probes_20260616/long_horizon_next_action/cosmos3_nano_future_window/metrics.json",
12675
  "exists": true,
12676
  "bytes": 7404,
12677
+ "sha256": "e5f884eaf3e9d133b52af2e1488163abb64b3b677f8083ba5d100db304b446d9"
12678
  },
12679
  "mirrors": {
12680
  "hf_artifacts": {
12681
  "path": "hf_artifacts:results/omni_finetune/model_output_task_probes_20260616/long_horizon_next_action/cosmos3_nano_future_window/metrics.json",
12682
  "exists": true,
12683
  "bytes": 7404,
12684
+ "sha256": "e5f884eaf3e9d133b52af2e1488163abb64b3b677f8083ba5d100db304b446d9"
12685
  },
12686
  "hf_model": {
12687
  "path": "hf_model:results/omni_finetune/model_output_task_probes_20260616/long_horizon_next_action/cosmos3_nano_future_window/metrics.json",
12688
  "exists": true,
12689
  "bytes": 7404,
12690
+ "sha256": "e5f884eaf3e9d133b52af2e1488163abb64b3b677f8083ba5d100db304b446d9"
12691
  }
12692
  },
12693
  "failures": []
 
12748
  "local": {
12749
  "path": "repo:results/omni_finetune/model_output_task_probes_20260616/summary.json",
12750
  "exists": true,
12751
+ "bytes": 3180,
12752
+ "sha256": "82a36cc5d23fa34792eac6b7124eecbed900d52c8f0b2a7921d409e236efd68a"
12753
  },
12754
  "mirrors": {
12755
  "hf_artifacts": {
12756
  "path": "hf_artifacts:results/omni_finetune/model_output_task_probes_20260616/summary.json",
12757
  "exists": true,
12758
+ "bytes": 3180,
12759
+ "sha256": "82a36cc5d23fa34792eac6b7124eecbed900d52c8f0b2a7921d409e236efd68a"
12760
  },
12761
  "hf_model": {
12762
  "path": "hf_model:results/omni_finetune/model_output_task_probes_20260616/summary.json",
12763
  "exists": true,
12764
+ "bytes": 3180,
12765
+ "sha256": "82a36cc5d23fa34792eac6b7124eecbed900d52c8f0b2a7921d409e236efd68a"
12766
+ }
12767
+ },
12768
+ "failures": []
12769
+ },
12770
+ {
12771
+ "name": "results/omni_finetune/model_output_task_probes_20260616/time_to_transition/cosmos3_super_reasoner/metrics.json",
12772
+ "status": "pass",
12773
+ "local": {
12774
+ "path": "repo:results/omni_finetune/model_output_task_probes_20260616/time_to_transition/cosmos3_super_reasoner/metrics.json",
12775
+ "exists": true,
12776
+ "bytes": 2049,
12777
+ "sha256": "8151b02a75feb144e9a4590715caf2f4301154b0d1b89d3624225628cd1e3f67"
12778
+ },
12779
+ "mirrors": {
12780
+ "hf_artifacts": {
12781
+ "path": "hf_artifacts:results/omni_finetune/model_output_task_probes_20260616/time_to_transition/cosmos3_super_reasoner/metrics.json",
12782
+ "exists": true,
12783
+ "bytes": 2049,
12784
+ "sha256": "8151b02a75feb144e9a4590715caf2f4301154b0d1b89d3624225628cd1e3f67"
12785
+ },
12786
+ "hf_model": {
12787
+ "path": "hf_model:results/omni_finetune/model_output_task_probes_20260616/time_to_transition/cosmos3_super_reasoner/metrics.json",
12788
+ "exists": true,
12789
+ "bytes": 2049,
12790
+ "sha256": "8151b02a75feb144e9a4590715caf2f4301154b0d1b89d3624225628cd1e3f67"
12791
+ }
12792
+ },
12793
+ "failures": []
12794
+ },
12795
+ {
12796
+ "name": "results/omni_finetune/model_output_task_probes_20260616/time_to_transition/cosmos3_super_reasoner/predictions.csv",
12797
+ "status": "pass",
12798
+ "local": {
12799
+ "path": "repo:results/omni_finetune/model_output_task_probes_20260616/time_to_transition/cosmos3_super_reasoner/predictions.csv",
12800
+ "exists": true,
12801
+ "bytes": 76139,
12802
+ "sha256": "a373e6326d33262086b278a365f0612346950b17f0f3bc02b33440e58bde33c3"
12803
+ },
12804
+ "mirrors": {
12805
+ "hf_artifacts": {
12806
+ "path": "hf_artifacts:results/omni_finetune/model_output_task_probes_20260616/time_to_transition/cosmos3_super_reasoner/predictions.csv",
12807
+ "exists": true,
12808
+ "bytes": 76139,
12809
+ "sha256": "a373e6326d33262086b278a365f0612346950b17f0f3bc02b33440e58bde33c3"
12810
+ },
12811
+ "hf_model": {
12812
+ "path": "hf_model:results/omni_finetune/model_output_task_probes_20260616/time_to_transition/cosmos3_super_reasoner/predictions.csv",
12813
+ "exists": true,
12814
+ "bytes": 76139,
12815
+ "sha256": "a373e6326d33262086b278a365f0612346950b17f0f3bc02b33440e58bde33c3"
12816
  }
12817
  },
12818
  "failures": []
 
20711
  "local": {
20712
  "path": "repo:TASK_METHOD_20_GAP_AUDIT.md",
20713
  "exists": true,
20714
+ "bytes": 9908,
20715
+ "sha256": "6b76d3cb4294150c5322b0af6c22fe52ed658d31b87a646fa26a54322d6a55e2"
20716
  },
20717
  "mirrors": {
20718
  "hf_space": {
20719
  "path": "hf_space:TASK_METHOD_20_GAP_AUDIT.md",
20720
  "exists": true,
20721
+ "bytes": 9908,
20722
+ "sha256": "6b76d3cb4294150c5322b0af6c22fe52ed658d31b87a646fa26a54322d6a55e2"
20723
  },
20724
  "hf_artifacts": {
20725
  "path": "hf_artifacts:TASK_METHOD_20_GAP_AUDIT.md",
20726
  "exists": true,
20727
+ "bytes": 9908,
20728
+ "sha256": "6b76d3cb4294150c5322b0af6c22fe52ed658d31b87a646fa26a54322d6a55e2"
20729
  },
20730
  "hf_model": {
20731
  "path": "hf_model:TASK_METHOD_20_GAP_AUDIT.md",
20732
  "exists": true,
20733
+ "bytes": 9908,
20734
+ "sha256": "6b76d3cb4294150c5322b0af6c22fe52ed658d31b87a646fa26a54322d6a55e2"
20735
  }
20736
  },
20737
  "failures": []
 
20742
  "local": {
20743
  "path": "repo:TASK_METHOD_20_RESULT_MATRIX.md",
20744
  "exists": true,
20745
+ "bytes": 3938,
20746
+ "sha256": "b15ca4161fc6aa94e5f452b14d802b37d80d565bbf64a795dfdaeef07e5263de"
20747
  },
20748
  "mirrors": {
20749
  "hf_space": {
20750
  "path": "hf_space:TASK_METHOD_20_RESULT_MATRIX.md",
20751
  "exists": true,
20752
+ "bytes": 3938,
20753
+ "sha256": "b15ca4161fc6aa94e5f452b14d802b37d80d565bbf64a795dfdaeef07e5263de"
20754
  },
20755
  "hf_artifacts": {
20756
  "path": "hf_artifacts:TASK_METHOD_20_RESULT_MATRIX.md",
20757
  "exists": true,
20758
+ "bytes": 3938,
20759
+ "sha256": "b15ca4161fc6aa94e5f452b14d802b37d80d565bbf64a795dfdaeef07e5263de"
20760
  },
20761
  "hf_model": {
20762
  "path": "hf_model:TASK_METHOD_20_RESULT_MATRIX.md",
20763
  "exists": true,
20764
+ "bytes": 3938,
20765
+ "sha256": "b15ca4161fc6aa94e5f452b14d802b37d80d565bbf64a795dfdaeef07e5263de"
20766
  }
20767
  },
20768
  "failures": []
docs/data/public_surface_qa.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "title": "Ropedia Xperience-10M Public Project Surface",
3
  "status": "pass",
4
- "generated_at_utc": "2026-06-18T14:41:36+00:00",
5
  "scope": "Repo README, GitHub Pages HTML, Hugging Face Space card, artifact dataset card, and model card.",
6
  "checks": [
7
  {
@@ -18,7 +18,7 @@
18
  "website_integrity": {
19
  "exists": true,
20
  "status": "pass",
21
- "generated_at_utc": "2026-06-18T14:35:14+00:00"
22
  },
23
  "rendered_site_check": {
24
  "exists": true,
@@ -28,12 +28,12 @@
28
  "task_surface_integrity": {
29
  "exists": true,
30
  "status": "pass",
31
- "generated_at_utc": "2026-06-18T14:34:58+00:00"
32
  },
33
  "source_alignment": {
34
  "exists": true,
35
  "status": "pass",
36
- "generated_at_utc": "2026-06-18T14:34:47+00:00"
37
  },
38
  "scale_up_status": {
39
  "exists": true,
@@ -43,12 +43,12 @@
43
  "publication_package": {
44
  "exists": true,
45
  "status": "pass",
46
- "generated_at_utc": "2026-06-18T14:35:40+00:00"
47
  },
48
  "mirror_parity": {
49
  "exists": true,
50
  "status": "pass",
51
- "generated_at_utc": "2026-06-18T14:37:04+00:00"
52
  }
53
  },
54
  "failures": {}
 
1
  {
2
  "title": "Ropedia Xperience-10M Public Project Surface",
3
  "status": "pass",
4
+ "generated_at_utc": "2026-06-18T15:37:09+00:00",
5
  "scope": "Repo README, GitHub Pages HTML, Hugging Face Space card, artifact dataset card, and model card.",
6
  "checks": [
7
  {
 
18
  "website_integrity": {
19
  "exists": true,
20
  "status": "pass",
21
+ "generated_at_utc": "2026-06-18T15:31:19+00:00"
22
  },
23
  "rendered_site_check": {
24
  "exists": true,
 
28
  "task_surface_integrity": {
29
  "exists": true,
30
  "status": "pass",
31
+ "generated_at_utc": "2026-06-18T15:31:10+00:00"
32
  },
33
  "source_alignment": {
34
  "exists": true,
35
  "status": "pass",
36
+ "generated_at_utc": "2026-06-18T15:31:10+00:00"
37
  },
38
  "scale_up_status": {
39
  "exists": true,
 
43
  "publication_package": {
44
  "exists": true,
45
  "status": "pass",
46
+ "generated_at_utc": "2026-06-18T15:32:30+00:00"
47
  },
48
  "mirror_parity": {
49
  "exists": true,
50
  "status": "pass",
51
+ "generated_at_utc": "2026-06-18T15:36:43+00:00"
52
  }
53
  },
54
  "failures": {}
docs/data/publication_audit.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
  "status": "pass",
3
- "generated_at_utc": "2026-06-18T14:58:23+00:00",
4
  "checks": [
5
  {
6
  "name": "required_publication_assets_present",
@@ -215,8 +215,8 @@
215
  "github_repo": {
216
  "root": "repo",
217
  "exists": true,
218
- "file_count": 1355,
219
- "text_file_count": 1132,
220
  "largest_file": {
221
  "path": "results/episode_task_suite/modality_reconstruction/predictions.npz",
222
  "bytes": 55702978
 
1
  {
2
  "status": "pass",
3
+ "generated_at_utc": "2026-06-18T15:32:30+00:00",
4
  "checks": [
5
  {
6
  "name": "required_publication_assets_present",
 
215
  "github_repo": {
216
  "root": "repo",
217
  "exists": true,
218
+ "file_count": 1357,
219
+ "text_file_count": 1134,
220
  "largest_file": {
221
  "path": "results/episode_task_suite/modality_reconstruction/predictions.npz",
222
  "bytes": 55702978
docs/data/quality_gates.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "title": "Ropedia Xperience-10M Release Checks",
3
  "status": "pass",
4
- "generated_at_utc": "2026-06-18T14:34:09+00:00",
5
  "rule": "A release is current when the automated reports pass and the live GitHub/Hugging Face mirrors are verified after publishing.",
6
  "automated_gates": [
7
  {
 
1
  {
2
  "title": "Ropedia Xperience-10M Release Checks",
3
  "status": "pass",
4
+ "generated_at_utc": "2026-06-18T15:37:08+00:00",
5
  "rule": "A release is current when the automated reports pass and the live GitHub/Hugging Face mirrors are verified after publishing.",
6
  "automated_gates": [
7
  {
docs/data/single_episode_task_model_radar.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "title": "Single-Episode 20-Task Radar",
3
  "status": "pass",
4
- "generated_at_utc": "2026-06-18T14:32:46+00:00",
5
  "description": "Minimal and Neural MLP baselines on the one public sample episode, both scored on all 20 task contracts.",
6
  "task_count": 20,
7
  "method_count": 2,
 
1
  {
2
  "title": "Single-Episode 20-Task Radar",
3
  "status": "pass",
4
+ "generated_at_utc": "2026-06-18T15:27:21+00:00",
5
  "description": "Minimal and Neural MLP baselines on the one public sample episode, both scored on all 20 task contracts.",
6
  "task_count": 20,
7
  "method_count": 2,
docs/data/source_alignment_audit.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "title": "Ropedia Xperience-10M Source Alignment Note",
3
  "status": "pass",
4
- "generated_at_utc": "2026-06-18T14:41:36+00:00",
5
  "alignment_json": "docs/data/xperience10m_dataset_card_alignment.json",
6
  "alignment_summary": {
7
  "full_dataset_repo": "ropedia-ai/xperience-10m",
 
1
  {
2
  "title": "Ropedia Xperience-10M Source Alignment Note",
3
  "status": "pass",
4
+ "generated_at_utc": "2026-06-18T15:31:10+00:00",
5
  "alignment_json": "docs/data/xperience10m_dataset_card_alignment.json",
6
  "alignment_summary": {
7
  "full_dataset_repo": "ropedia-ai/xperience-10m",
docs/data/task_method_20_gap_audit.json CHANGED
@@ -1,10 +1,10 @@
1
  {
2
- "generated_at_utc": "2026-06-18T14:33:00+00:00",
3
  "immediate_actions": [
4
  {
5
  "artifact": "docs/data/task_method_20_gap_audit.json",
6
  "id": "gap_audit",
7
- "purpose": "Keep the 36 scoreless cells visible and reproducible."
8
  },
9
  {
10
  "artifact": "scripts/omni/score_model_output_probes.py",
@@ -37,11 +37,11 @@
37
  "proxy_scored_task_count": 0,
38
  "result_record_count": 20,
39
  "scope": "128 selected episodes, held-out test",
40
- "scored_task_count": 7,
41
- "scoreless_task_count": 13,
42
  "status_counts": {
43
- "not_evaluated_in_verified_package": 13,
44
- "scored": 7
45
  }
46
  },
47
  "metadata128_neural_mlp": {
@@ -136,13 +136,13 @@
136
  },
137
  "missing_by_method": {
138
  "cosmos3_nano_future_window": 14,
139
- "cosmos3_super_reasoner": 13,
140
  "metadata128_neural_mlp": 2,
141
  "metadata128_simple": 2,
142
  "qwen3_omni_v6_lora": 5
143
  },
144
  "missing_by_status": {
145
- "not_evaluated_in_verified_package": 32,
146
  "not_supported_by_metadata_only_package": 2,
147
  "unsupported_without_required_target": 2
148
  },
@@ -212,8 +212,7 @@
212
  "qwen3_omni_v6_lora"
213
  ],
214
  "20 Time-to-Next-Transition Regression": [
215
- "cosmos3_nano_future_window",
216
- "cosmos3_super_reasoner"
217
  ]
218
  },
219
  "missing_records": [
@@ -659,19 +658,6 @@
659
  "task_label": "Camera-View Synchronization Retrieval",
660
  "task_number": 19
661
  },
662
- {
663
- "method": "Cosmos3-Super Reasoner",
664
- "metric_key": "mae",
665
- "reason": "the verified public model package did not ask this branch to emit that task target; a new task-specific evaluation package is required for a numeric score",
666
- "recommended_next_step": "Generate verified model outputs for this task contract and score them against the held-out labels.",
667
- "scope": "multi_episode_128_partial_model_overlay",
668
- "series_id": "cosmos3_super_reasoner",
669
- "status": "not_evaluated_in_verified_package",
670
- "status_label": "not evaluated",
671
- "task_id": "time_to_transition",
672
- "task_label": "Time-to-Next-Transition Regression",
673
- "task_number": 20
674
- },
675
  {
676
  "method": "Cosmos3-Nano Future Window",
677
  "metric_key": "mae",
@@ -732,8 +718,8 @@
732
  "method_count": 9,
733
  "method_task_record_count": 180,
734
  "proxy_scored_method_task_count": 4,
735
- "scored_method_task_count": 144,
736
- "scoreless_method_task_count": 36,
737
  "task_count": 20
738
  },
739
  "source_matrix": "docs/data/task_method_20_result_matrix.json",
 
1
  {
2
+ "generated_at_utc": "2026-06-18T15:28:01+00:00",
3
  "immediate_actions": [
4
  {
5
  "artifact": "docs/data/task_method_20_gap_audit.json",
6
  "id": "gap_audit",
7
+ "purpose": "Keep the 35 scoreless cells visible and reproducible."
8
  },
9
  {
10
  "artifact": "scripts/omni/score_model_output_probes.py",
 
37
  "proxy_scored_task_count": 0,
38
  "result_record_count": 20,
39
  "scope": "128 selected episodes, held-out test",
40
+ "scored_task_count": 8,
41
+ "scoreless_task_count": 12,
42
  "status_counts": {
43
+ "not_evaluated_in_verified_package": 12,
44
+ "scored": 8
45
  }
46
  },
47
  "metadata128_neural_mlp": {
 
136
  },
137
  "missing_by_method": {
138
  "cosmos3_nano_future_window": 14,
139
+ "cosmos3_super_reasoner": 12,
140
  "metadata128_neural_mlp": 2,
141
  "metadata128_simple": 2,
142
  "qwen3_omni_v6_lora": 5
143
  },
144
  "missing_by_status": {
145
+ "not_evaluated_in_verified_package": 31,
146
  "not_supported_by_metadata_only_package": 2,
147
  "unsupported_without_required_target": 2
148
  },
 
212
  "qwen3_omni_v6_lora"
213
  ],
214
  "20 Time-to-Next-Transition Regression": [
215
+ "cosmos3_nano_future_window"
 
216
  ]
217
  },
218
  "missing_records": [
 
658
  "task_label": "Camera-View Synchronization Retrieval",
659
  "task_number": 19
660
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
661
  {
662
  "method": "Cosmos3-Nano Future Window",
663
  "metric_key": "mae",
 
718
  "method_count": 9,
719
  "method_task_record_count": 180,
720
  "proxy_scored_method_task_count": 4,
721
+ "scored_method_task_count": 145,
722
+ "scoreless_method_task_count": 35,
723
  "task_count": 20
724
  },
725
  "source_matrix": "docs/data/task_method_20_result_matrix.json",
docs/data/task_method_20_result_matrix.json CHANGED
@@ -1,11 +1,11 @@
1
  {
2
  "title": "Task Method 20-Result Matrix",
3
  "status": "pass",
4
- "generated_at_utc": "2026-06-18T14:32:46+00:00",
5
  "task_count": 20,
6
  "method_count": 9,
7
  "method_task_record_count": 180,
8
- "scored_method_task_count": 144,
9
  "series": [
10
  {
11
  "id": "minimal",
@@ -181,20 +181,20 @@
181
  "kind": "partial_128_episode_foundation_model_overlay",
182
  "scope": "128 selected episodes, held-out test",
183
  "stroke_dasharray": "4 7",
184
- "method_detail": "Verified Cosmos3-Super base-weight Reasoner JSON-task evaluation, plus task 16 scored from existing verified action/object JSON.",
185
  "plotted_as": "colored point overlay",
186
  "result_record_count": 20,
187
- "scored_task_count": 7,
188
- "covered_task_count": 7,
189
  "proxy_scored_task_count": 0,
190
- "scoreless_task_count": 13,
191
  "unsupported_task_count": 0,
192
- "not_evaluated_task_count": 13,
193
  "status_counts": {
194
- "not_evaluated_in_verified_package": 13,
195
- "scored": 7
196
  },
197
- "coverage_fraction": 0.35,
198
  "result_record_fraction": 1.0
199
  },
200
  {
@@ -3433,17 +3433,17 @@
3433
  "task_label": "Time-to-Next-Transition Regression",
3434
  "series_id": "cosmos3_super_reasoner",
3435
  "method": "Cosmos3-Super Reasoner",
3436
- "status": "not_evaluated_in_verified_package",
3437
- "status_label": "not evaluated",
3438
- "scored": false,
3439
  "proxy_scored": false,
3440
- "raw": null,
3441
- "raw_text": "n/a",
3442
- "normalized_score": null,
3443
- "metric_key": "mae",
3444
- "source": null,
3445
  "scope": "multi_episode_128_partial_model_overlay",
3446
- "reason": "the verified public model package did not ask this branch to emit that task target; a new task-specific evaluation package is required for a numeric score"
3447
  },
3448
  {
3449
  "task_number": 20,
 
1
  {
2
  "title": "Task Method 20-Result Matrix",
3
  "status": "pass",
4
+ "generated_at_utc": "2026-06-18T15:27:21+00:00",
5
  "task_count": 20,
6
  "method_count": 9,
7
  "method_task_record_count": 180,
8
+ "scored_method_task_count": 145,
9
  "series": [
10
  {
11
  "id": "minimal",
 
181
  "kind": "partial_128_episode_foundation_model_overlay",
182
  "scope": "128 selected episodes, held-out test",
183
  "stroke_dasharray": "4 7",
184
+ "method_detail": "Verified Cosmos3-Super base-weight Reasoner JSON-task evaluation, plus task 16 and a derived task-20 action-boundary timing probe scored from existing verified JSON.",
185
  "plotted_as": "colored point overlay",
186
  "result_record_count": 20,
187
+ "scored_task_count": 8,
188
+ "covered_task_count": 8,
189
  "proxy_scored_task_count": 0,
190
+ "scoreless_task_count": 12,
191
  "unsupported_task_count": 0,
192
+ "not_evaluated_task_count": 12,
193
  "status_counts": {
194
+ "not_evaluated_in_verified_package": 12,
195
+ "scored": 8
196
  },
197
+ "coverage_fraction": 0.4,
198
  "result_record_fraction": 1.0
199
  },
200
  {
 
3433
  "task_label": "Time-to-Next-Transition Regression",
3434
  "series_id": "cosmos3_super_reasoner",
3435
  "method": "Cosmos3-Super Reasoner",
3436
+ "status": "scored",
3437
+ "status_label": "scored",
3438
+ "scored": true,
3439
  "proxy_scored": false,
3440
+ "raw": 52.94642857142857,
3441
+ "raw_text": "52.95",
3442
+ "normalized_score": 0.19901920981190058,
3443
+ "metric_key": "time_to_transition_mae",
3444
+ "source": "results/omni_finetune/model_output_task_probes_20260616/time_to_transition/cosmos3_super_reasoner/metrics.json",
3445
  "scope": "multi_episode_128_partial_model_overlay",
3446
+ "reason": null
3447
  },
3448
  {
3449
  "task_number": 20,
docs/data/task_surface_integrity.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
  "status": "pass",
3
- "generated_at_utc": "2026-06-18T14:42:41+00:00",
4
  "summary": {
5
  "task_count": 12,
6
  "expected_task_count": 12,
 
1
  {
2
  "status": "pass",
3
+ "generated_at_utc": "2026-06-18T15:31:10+00:00",
4
  "summary": {
5
  "task_count": 12,
6
  "expected_task_count": 12,
docs/data/unified_task_model_radar.json CHANGED
@@ -1,11 +1,11 @@
1
  {
2
  "title": "Unified 20-Task Model Radar",
3
  "status": "pass",
4
- "generated_at_utc": "2026-06-18T14:32:46+00:00",
5
  "task_count": 20,
6
  "method_count": 9,
7
  "method_task_record_count": 180,
8
- "scored_method_task_count": 144,
9
  "normalization_policy": {
10
  "higher_is_better": "bounded metrics are plotted directly on 0-1 axes after clipping to [0, 1]",
11
  "lower_is_better": "lower-error metrics are converted to best_observed_value / raw_value within the same task",
@@ -190,20 +190,20 @@
190
  "kind": "partial_128_episode_foundation_model_overlay",
191
  "scope": "128 selected episodes, held-out test",
192
  "stroke_dasharray": "4 7",
193
- "method_detail": "Verified Cosmos3-Super base-weight Reasoner JSON-task evaluation, plus task 16 scored from existing verified action/object JSON.",
194
  "plotted_as": "colored point overlay",
195
  "result_record_count": 20,
196
- "scored_task_count": 7,
197
- "covered_task_count": 7,
198
  "proxy_scored_task_count": 0,
199
- "scoreless_task_count": 13,
200
  "unsupported_task_count": 0,
201
- "not_evaluated_task_count": 13,
202
  "status_counts": {
203
- "not_evaluated_in_verified_package": 13,
204
- "scored": 7
205
  },
206
- "coverage_fraction": 0.35,
207
  "result_record_fraction": 1.0
208
  },
209
  {
@@ -2373,6 +2373,17 @@
2373
  "raw_text": "10.55",
2374
  "status_label": "scored"
2375
  },
 
 
 
 
 
 
 
 
 
 
 
2376
  "qwen3_omni_v6_lora": {
2377
  "raw": 134.0687422166874,
2378
  "metric_key": "time_to_transition_mae",
@@ -2428,17 +2439,6 @@
2428
  "raw_text": "42.37",
2429
  "status_label": "scored"
2430
  },
2431
- "cosmos3_super_reasoner": {
2432
- "raw": null,
2433
- "metric_key": "mae",
2434
- "source": null,
2435
- "scope": "multi_episode_128_partial_model_overlay",
2436
- "status": "not_evaluated_in_verified_package",
2437
- "reason": "the verified public model package did not ask this branch to emit that task target; a new task-specific evaluation package is required for a numeric score",
2438
- "normalized_score": null,
2439
- "raw_text": "n/a",
2440
- "status_label": "not evaluated"
2441
- },
2442
  "cosmos3_nano_future_window": {
2443
  "raw": null,
2444
  "metric_key": "mae",
@@ -2499,7 +2499,7 @@
2499
  "id": "cosmos3_super_reasoner",
2500
  "title": "Cosmos3-Super Reasoner",
2501
  "status": "verified_base_weight_eval",
2502
- "coverage": "20 records / 7 scored task-aligned axes",
2503
  "headline": "JSON validity 0.5112; action macro-F1 0.0008",
2504
  "source": "results/omni_finetune/verified_public/xperience10m_cosmos3_super_reasoner_128ep_test_full_20260607/eval/metrics.json"
2505
  },
@@ -5731,17 +5731,17 @@
5731
  "task_label": "Time-to-Next-Transition Regression",
5732
  "series_id": "cosmos3_super_reasoner",
5733
  "method": "Cosmos3-Super Reasoner",
5734
- "status": "not_evaluated_in_verified_package",
5735
- "status_label": "not evaluated",
5736
- "scored": false,
5737
  "proxy_scored": false,
5738
- "raw": null,
5739
- "raw_text": "n/a",
5740
- "normalized_score": null,
5741
- "metric_key": "mae",
5742
- "source": null,
5743
  "scope": "multi_episode_128_partial_model_overlay",
5744
- "reason": "the verified public model package did not ask this branch to emit that task target; a new task-specific evaluation package is required for a numeric score"
5745
  },
5746
  {
5747
  "task_number": 20,
 
1
  {
2
  "title": "Unified 20-Task Model Radar",
3
  "status": "pass",
4
+ "generated_at_utc": "2026-06-18T15:27:21+00:00",
5
  "task_count": 20,
6
  "method_count": 9,
7
  "method_task_record_count": 180,
8
+ "scored_method_task_count": 145,
9
  "normalization_policy": {
10
  "higher_is_better": "bounded metrics are plotted directly on 0-1 axes after clipping to [0, 1]",
11
  "lower_is_better": "lower-error metrics are converted to best_observed_value / raw_value within the same task",
 
190
  "kind": "partial_128_episode_foundation_model_overlay",
191
  "scope": "128 selected episodes, held-out test",
192
  "stroke_dasharray": "4 7",
193
+ "method_detail": "Verified Cosmos3-Super base-weight Reasoner JSON-task evaluation, plus task 16 and a derived task-20 action-boundary timing probe scored from existing verified JSON.",
194
  "plotted_as": "colored point overlay",
195
  "result_record_count": 20,
196
+ "scored_task_count": 8,
197
+ "covered_task_count": 8,
198
  "proxy_scored_task_count": 0,
199
+ "scoreless_task_count": 12,
200
  "unsupported_task_count": 0,
201
+ "not_evaluated_task_count": 12,
202
  "status_counts": {
203
+ "not_evaluated_in_verified_package": 12,
204
+ "scored": 8
205
  },
206
+ "coverage_fraction": 0.4,
207
  "result_record_fraction": 1.0
208
  },
209
  {
 
2373
  "raw_text": "10.55",
2374
  "status_label": "scored"
2375
  },
2376
+ "cosmos3_super_reasoner": {
2377
+ "raw": 52.94642857142857,
2378
+ "metric_key": "time_to_transition_mae",
2379
+ "source": "results/omni_finetune/model_output_task_probes_20260616/time_to_transition/cosmos3_super_reasoner/metrics.json",
2380
+ "scope": "multi_episode_128_partial_model_overlay",
2381
+ "status": "scored",
2382
+ "reason": null,
2383
+ "normalized_score": 0.19901920981190058,
2384
+ "raw_text": "52.95",
2385
+ "status_label": "scored"
2386
+ },
2387
  "qwen3_omni_v6_lora": {
2388
  "raw": 134.0687422166874,
2389
  "metric_key": "time_to_transition_mae",
 
2439
  "raw_text": "42.37",
2440
  "status_label": "scored"
2441
  },
 
 
 
 
 
 
 
 
 
 
 
2442
  "cosmos3_nano_future_window": {
2443
  "raw": null,
2444
  "metric_key": "mae",
 
2499
  "id": "cosmos3_super_reasoner",
2500
  "title": "Cosmos3-Super Reasoner",
2501
  "status": "verified_base_weight_eval",
2502
+ "coverage": "20 records / 8 scored task-aligned axes",
2503
  "headline": "JSON validity 0.5112; action macro-F1 0.0008",
2504
  "source": "results/omni_finetune/verified_public/xperience10m_cosmos3_super_reasoner_128ep_test_full_20260607/eval/metrics.json"
2505
  },
 
5731
  "task_label": "Time-to-Next-Transition Regression",
5732
  "series_id": "cosmos3_super_reasoner",
5733
  "method": "Cosmos3-Super Reasoner",
5734
+ "status": "scored",
5735
+ "status_label": "scored",
5736
+ "scored": true,
5737
  "proxy_scored": false,
5738
+ "raw": 52.94642857142857,
5739
+ "raw_text": "52.95",
5740
+ "normalized_score": 0.19901920981190058,
5741
+ "metric_key": "time_to_transition_mae",
5742
+ "source": "results/omni_finetune/model_output_task_probes_20260616/time_to_transition/cosmos3_super_reasoner/metrics.json",
5743
  "scope": "multi_episode_128_partial_model_overlay",
5744
+ "reason": null
5745
  },
5746
  {
5747
  "task_number": 20,
docs/data/website_integrity.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
  "status": "pass",
3
- "generated_at_utc": "2026-06-18T14:41:36+00:00",
4
  "docs_root": "docs",
5
  "site_base": "/ropedia-xperience-10m-task-suite/",
6
  "summary": {
@@ -301,7 +301,7 @@
301
  },
302
  {
303
  "path": "data/artifact_index.json",
304
- "bytes": 116111,
305
  "top_level_type": "dict"
306
  },
307
  {
@@ -316,7 +316,7 @@
316
  },
317
  {
318
  "path": "data/episode128_task_model_radar.json",
319
- "bytes": 185503,
320
  "top_level_type": "dict"
321
  },
322
  {
@@ -351,7 +351,7 @@
351
  },
352
  {
353
  "path": "data/mirror_parity.json",
354
- "bytes": 1106958,
355
  "top_level_type": "dict"
356
  },
357
  {
@@ -401,7 +401,7 @@
401
  },
402
  {
403
  "path": "data/publication_audit.json",
404
- "bytes": 9598,
405
  "top_level_type": "dict"
406
  },
407
  {
@@ -486,12 +486,12 @@
486
  },
487
  {
488
  "path": "data/task_method_20_gap_audit.json",
489
- "bytes": 35121,
490
  "top_level_type": "dict"
491
  },
492
  {
493
  "path": "data/task_method_20_result_matrix.json",
494
- "bytes": 128856,
495
  "top_level_type": "dict"
496
  },
497
  {
@@ -526,12 +526,12 @@
526
  },
527
  {
528
  "path": "data/unified_task_model_radar.json",
529
- "bytes": 229355,
530
  "top_level_type": "dict"
531
  },
532
  {
533
  "path": "data/website_integrity.json",
534
- "bytes": 20022,
535
  "top_level_type": "dict"
536
  },
537
  {
@@ -571,7 +571,7 @@
571
  {
572
  "path": "assets/charts/episode128_task_model_radar.svg",
573
  "exists": true,
574
- "bytes": 47886,
575
  "format": "SVG",
576
  "has_viewbox": true
577
  },
@@ -641,7 +641,7 @@
641
  {
642
  "path": "assets/charts/unified_task_model_radar.svg",
643
  "exists": true,
644
- "bytes": 53899,
645
  "format": "SVG",
646
  "has_viewbox": true
647
  },
 
1
  {
2
  "status": "pass",
3
+ "generated_at_utc": "2026-06-18T15:31:19+00:00",
4
  "docs_root": "docs",
5
  "site_base": "/ropedia-xperience-10m-task-suite/",
6
  "summary": {
 
301
  },
302
  {
303
  "path": "data/artifact_index.json",
304
+ "bytes": 116109,
305
  "top_level_type": "dict"
306
  },
307
  {
 
316
  },
317
  {
318
  "path": "data/episode128_task_model_radar.json",
319
+ "bytes": 185480,
320
  "top_level_type": "dict"
321
  },
322
  {
 
351
  },
352
  {
353
  "path": "data/mirror_parity.json",
354
+ "bytes": 919718,
355
  "top_level_type": "dict"
356
  },
357
  {
 
401
  },
402
  {
403
  "path": "data/publication_audit.json",
404
+ "bytes": 9520,
405
  "top_level_type": "dict"
406
  },
407
  {
 
486
  },
487
  {
488
  "path": "data/task_method_20_gap_audit.json",
489
+ "bytes": 34384,
490
  "top_level_type": "dict"
491
  },
492
  {
493
  "path": "data/task_method_20_result_matrix.json",
494
+ "bytes": 128862,
495
  "top_level_type": "dict"
496
  },
497
  {
 
526
  },
527
  {
528
  "path": "data/unified_task_model_radar.json",
529
+ "bytes": 229332,
530
  "top_level_type": "dict"
531
  },
532
  {
533
  "path": "data/website_integrity.json",
534
+ "bytes": 20021,
535
  "top_level_type": "dict"
536
  },
537
  {
 
571
  {
572
  "path": "assets/charts/episode128_task_model_radar.svg",
573
  "exists": true,
574
+ "bytes": 48019,
575
  "format": "SVG",
576
  "has_viewbox": true
577
  },
 
641
  {
642
  "path": "assets/charts/unified_task_model_radar.svg",
643
  "exists": true,
644
+ "bytes": 54032,
645
  "format": "SVG",
646
  "has_viewbox": true
647
  },