cy0307 commited on
Commit
094eb82
·
verified ·
1 Parent(s): 557a248

Add files using upload-large-folder tool

Browse files
Files changed (27) hide show
  1. data/artifact_index.json +29 -29
  2. data/episode128_task_model_radar.json +52 -52
  3. data/mirror_parity.json +493 -273
  4. data/public_surface_qa.json +7 -7
  5. data/quality_gates.json +1 -1
  6. data/single_episode_task_model_radar.json +1 -1
  7. data/source_alignment_audit.json +1 -1
  8. data/task_method_20_gap_audit.json +16 -46
  9. data/task_method_20_result_matrix.json +36 -36
  10. data/task_surface_integrity.json +1 -1
  11. data/website_integrity.json +9 -9
  12. results/omni_finetune/model_output_probe_readiness/RUN_REPORT.md +4 -4
  13. results/omni_finetune/model_output_probe_readiness/model_output_probe_readiness.json +9 -14
  14. results/omni_finetune/model_output_task_probes_20260616/action_object_relation/cosmos3_nano_future_window/metrics.json +187 -0
  15. results/omni_finetune/model_output_task_probes_20260616/action_object_relation/cosmos3_nano_future_window/per_class_metrics.csv +152 -0
  16. results/omni_finetune/model_output_task_probes_20260616/action_object_relation/cosmos3_nano_future_window/predictions.csv +0 -0
  17. results/omni_finetune/model_output_task_probes_20260616/action_object_relation/cosmos3_super_reasoner/metrics.json +1 -1
  18. results/omni_finetune/model_output_task_probes_20260616/action_object_relation/qwen3_omni_v6_lora/metrics.json +1 -1
  19. results/omni_finetune/model_output_task_probes_20260616/caption_grounding/cosmos3_super_reasoner/metrics.json +28 -0
  20. results/omni_finetune/model_output_task_probes_20260616/caption_grounding/cosmos3_super_reasoner/predictions.csv +449 -0
  21. results/omni_finetune/model_output_task_probes_20260616/next_subtask_forecast/cosmos3_nano_future_window/metrics.json +1 -1
  22. results/omni_finetune/model_output_task_probes_20260616/object_set_forecast/cosmos3_nano_future_window/metrics.json +1 -1
  23. results/omni_finetune/model_output_task_probes_20260616/summary.json +17 -5
  24. results/omni_finetune/model_output_task_probes_20260616/time_to_transition/cosmos3_nano_future_window/metrics.json +1 -1
  25. results/omni_finetune/model_output_task_probes_20260616/time_to_transition/cosmos3_super_reasoner/metrics.json +1 -1
  26. scripts/build_unified_task_model_radar.py +16 -2
  27. scripts/omni/score_existing_model_output_task_probes.py +296 -6
data/artifact_index.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
  "title": "Ropedia Xperience-10M Task Suite Artifact Index",
3
- "generated_at_utc": "2026-06-18T22:26:00+00:00",
4
  "status": "pass",
5
  "artifact_count": 214,
6
  "missing": [],
@@ -610,7 +610,7 @@
610
  "shows": "Machine-readable source-alignment pass/fail check for repo, website, and HF surfaces.",
611
  "exists": true,
612
  "bytes": 4432,
613
- "sha256": "e767067c3568632f9ae600cdf123a2dae41a1cf703b7554fde7cd9b1bfee425f"
614
  },
615
  {
616
  "id": "source_alignment_validator",
@@ -730,8 +730,8 @@
730
  "surface": "website_hf",
731
  "shows": "Stores normalized 20-axis radar values, raw task metrics, Qwen3/Cosmos overlay mappings, branch-card caveats, and explicit scoreless status records.",
732
  "exists": true,
733
- "bytes": 229244,
734
- "sha256": "6e9de603b3f2ca60ee099135e9df559781f7481a87f6cdc7ec8873b798e14990"
735
  },
736
  {
737
  "id": "single_episode_task_model_radar_json",
@@ -742,7 +742,7 @@
742
  "shows": "Machine-readable split radar for the one-episode Minimal and Neural MLP baselines, both scored on all 20 task contracts.",
743
  "exists": true,
744
  "bytes": 51064,
745
- "sha256": "6a78822649c3318371bd1943bc4aceb6216052d832b682a98d4f887dab9c2756"
746
  },
747
  {
748
  "id": "episode128_task_model_radar_json",
@@ -752,8 +752,8 @@
752
  "surface": "website_hf",
753
  "shows": "Machine-readable split radar for selected 128-episode metadata/raw baselines and verified Qwen3/Cosmos branches, preserving explicit scoreless cells.",
754
  "exists": true,
755
- "bytes": 185391,
756
- "sha256": "53fbfad3e38a6accae25bb345f4682e39ebab69948df5a3423096eb7ed68b5d7"
757
  },
758
  {
759
  "id": "task_method_20_result_matrix_json",
@@ -763,8 +763,8 @@
763
  "surface": "website_hf",
764
  "shows": "Machine-readable 9-method by 20-task matrix where every method has 20 records and scoreless cells carry unsupported/not-evaluated reasons.",
765
  "exists": true,
766
- "bytes": 128842,
767
- "sha256": "a361c2528ccbbd6b1b53ede78e6d39353aa98630bcfed7b8014b77b05c4f226b"
768
  },
769
  {
770
  "id": "task_method_20_result_matrix",
@@ -774,8 +774,8 @@
774
  "surface": "repo_hf",
775
  "shows": "Reader-facing table that separates 20 records per method from numeric scored axes, documented raw128 proxy scores, unsupported metadata targets, and model targets not evaluated in verified packages.",
776
  "exists": true,
777
- "bytes": 3892,
778
- "sha256": "590d9362624d64b81b1b19638c46faa7969730d40415e4825abd2ff09d76340a"
779
  },
780
  {
781
  "id": "task_method_20_gap_audit_json",
@@ -785,8 +785,8 @@
785
  "surface": "website_hf",
786
  "shows": "Machine-readable 180-record gap ledger with numeric scores, scoreless cells, explicit status reasons, and next evidence needed before new scores can be published.",
787
  "exists": true,
788
- "bytes": 29788,
789
- "sha256": "143e03828559e706ab083b3824731d652bcb5a915cfb441caa4a3e6447a982f2"
790
  },
791
  {
792
  "id": "task_method_20_gap_audit",
@@ -796,8 +796,8 @@
796
  "surface": "repo_hf",
797
  "shows": "Reader-facing ledger that lists every scoreless method-task cell and the concrete target or model-output evidence required before it can become numeric.",
798
  "exists": true,
799
- "bytes": 8787,
800
- "sha256": "8fd8555f75cd96c31346618ab622e24655027cea5c52e8a09a7a53793ef7b72b"
801
  },
802
  {
803
  "id": "unified_task_model_radar_chart",
@@ -807,8 +807,8 @@
807
  "surface": "website_hf",
808
  "shows": "Compares minimal and neural MLP baselines across all 20 tasks, with Qwen3/Cosmos task-aligned model overlays.",
809
  "exists": true,
810
- "bytes": 54717,
811
- "sha256": "8fb6de7004e8463c28d6ada669c475d19986a1a3689778c691717cff39a7531a"
812
  },
813
  {
814
  "id": "single_episode_task_model_radar_chart",
@@ -829,8 +829,8 @@
829
  "surface": "website_hf",
830
  "shows": "Separates the selected 128-episode methods: raw-feature simple/NN as complete 20/20 scored polygons and metadata/Qwen/Cosmos as task-aligned overlays.",
831
  "exists": true,
832
- "bytes": 48704,
833
- "sha256": "45f8a79dc764ddbf0182ab7994fbfa5002b52b075951ab42831ecbfb3fd0405c"
834
  },
835
  {
836
  "id": "unified_task_model_radar_builder",
@@ -840,8 +840,8 @@
840
  "surface": "repo_hf",
841
  "shows": "Regenerates the direction-aware radar chart and machine-readable metric overlay JSON.",
842
  "exists": true,
843
- "bytes": 56295,
844
- "sha256": "237ef6a08dd81b9fcb0256f6f6b54394f74c14daea0cbba8f1726fdbbb7feff0"
845
  },
846
  {
847
  "id": "task_method_20_gap_audit_builder",
@@ -873,8 +873,8 @@
873
  "surface": "repo_hf",
874
  "shows": "Checks whether Qwen3/Cosmos branches have train, validation, and test prediction files before extending model overlays to all 20 task contracts.",
875
  "exists": true,
876
- "bytes": 5144,
877
- "sha256": "86835a291c659d335ab5b51d09ea3f36710c14d23466a72d9c2a23137dc9ae8a"
878
  },
879
  {
880
  "id": "model_output_probe_script",
@@ -895,8 +895,8 @@
895
  "surface": "repo_hf",
896
  "shows": "Scores task-specific Qwen3/Cosmos overlays only where verified held-out prediction JSON or compact target maps already contain the required targets.",
897
  "exists": true,
898
- "bytes": 5278,
899
- "sha256": "4a27f39807e8ac13771e2109584a8b0265961bcea88445058cbfe87265457d7f"
900
  },
901
  {
902
  "id": "existing_model_output_task_probe_script",
@@ -906,8 +906,8 @@
906
  "surface": "repo_hf",
907
  "shows": "Derives task-specific scores from committed verified model outputs without running new inference or backfilling absent targets.",
908
  "exists": true,
909
- "bytes": 57470,
910
- "sha256": "9a0708885c1a22addc0bec199488021e277c7a7b7e23d6a37344fbbb3e5f1b96"
911
  },
912
  {
913
  "id": "a100_128_metadata_task_baselines",
@@ -1116,7 +1116,7 @@
1116
  "shows": "Machine-readable release-check summary for validators, mirrors, and public project surfaces.",
1117
  "exists": true,
1118
  "bytes": 8100,
1119
- "sha256": "12cec90cfb4bd783f397852f04ffba5b9d0ae9316667bdee4719cbd6f2d3579a"
1120
  },
1121
  {
1122
  "id": "public_surface_qa",
@@ -1321,7 +1321,7 @@
1321
  "volatile": true,
1322
  "shows": "Confirms prepared GitHub/HF Space/artifact/model mirrors share the same critical data, figure, website HTML, and validator files.",
1323
  "exists": true,
1324
- "bytes": 938745,
1325
  "hash_policy": "existence_and_size_only"
1326
  },
1327
  {
 
1
  {
2
  "title": "Ropedia Xperience-10M Task Suite Artifact Index",
3
+ "generated_at_utc": "2026-06-18T22:57:14+00:00",
4
  "status": "pass",
5
  "artifact_count": 214,
6
  "missing": [],
 
610
  "shows": "Machine-readable source-alignment pass/fail check for repo, website, and HF surfaces.",
611
  "exists": true,
612
  "bytes": 4432,
613
+ "sha256": "1df30908392b455cc7263154126d55709cf97c60ff4213f0eee9ce17d92fb234"
614
  },
615
  {
616
  "id": "source_alignment_validator",
 
730
  "surface": "website_hf",
731
  "shows": "Stores normalized 20-axis radar values, raw task metrics, Qwen3/Cosmos overlay mappings, branch-card caveats, and explicit scoreless status records.",
732
  "exists": true,
733
+ "bytes": 229168,
734
+ "sha256": "64c7c10f3ce663178f2eea4740bb45de0f94b1246448f14f5521d293be916e77"
735
  },
736
  {
737
  "id": "single_episode_task_model_radar_json",
 
742
  "shows": "Machine-readable split radar for the one-episode Minimal and Neural MLP baselines, both scored on all 20 task contracts.",
743
  "exists": true,
744
  "bytes": 51064,
745
+ "sha256": "9d42b045d833e50a2bfa8905203150af1f28ea4736d22edb0fe27e39eedf4574"
746
  },
747
  {
748
  "id": "episode128_task_model_radar_json",
 
752
  "surface": "website_hf",
753
  "shows": "Machine-readable split radar for selected 128-episode metadata/raw baselines and verified Qwen3/Cosmos branches, preserving explicit scoreless cells.",
754
  "exists": true,
755
+ "bytes": 185314,
756
+ "sha256": "5c61c8f9a4a9a7b6bdc65e39ef5fda6117df48412afe260c0be4da501bd7e8db"
757
  },
758
  {
759
  "id": "task_method_20_result_matrix_json",
 
763
  "surface": "website_hf",
764
  "shows": "Machine-readable 9-method by 20-task matrix where every method has 20 records and scoreless cells carry unsupported/not-evaluated reasons.",
765
  "exists": true,
766
+ "bytes": 128805,
767
+ "sha256": "d5572768c6fb671eadf87870d20c8645dfae384f862aa63e929b2db50a5cc51a"
768
  },
769
  {
770
  "id": "task_method_20_result_matrix",
 
774
  "surface": "repo_hf",
775
  "shows": "Reader-facing table that separates 20 records per method from numeric scored axes, documented raw128 proxy scores, unsupported metadata targets, and model targets not evaluated in verified packages.",
776
  "exists": true,
777
+ "bytes": 3876,
778
+ "sha256": "a9ce23a452ca73b6d08219ffaac1782d5baad11f9e3662138b62cb4cd5ff206f"
779
  },
780
  {
781
  "id": "task_method_20_gap_audit_json",
 
785
  "surface": "website_hf",
786
  "shows": "Machine-readable 180-record gap ledger with numeric scores, scoreless cells, explicit status reasons, and next evidence needed before new scores can be published.",
787
  "exists": true,
788
+ "bytes": 28259,
789
+ "sha256": "860dea3d3ce2f2c2146c97918a5deca05ae315238b584c10e53f74a9d2c26dcd"
790
  },
791
  {
792
  "id": "task_method_20_gap_audit",
 
796
  "surface": "repo_hf",
797
  "shows": "Reader-facing ledger that lists every scoreless method-task cell and the concrete target or model-output evidence required before it can become numeric.",
798
  "exists": true,
799
+ "bytes": 8428,
800
+ "sha256": "b33c7f91565a2603b138eb4ec1c6df32d823225b16563eba279f416b0fe2a964"
801
  },
802
  {
803
  "id": "unified_task_model_radar_chart",
 
807
  "surface": "website_hf",
808
  "shows": "Compares minimal and neural MLP baselines across all 20 tasks, with Qwen3/Cosmos task-aligned model overlays.",
809
  "exists": true,
810
+ "bytes": 54936,
811
+ "sha256": "f29db4099d60c093ebd092bee37a2fc1338bbff17d7e52b8a1b27ae6fc06727a"
812
  },
813
  {
814
  "id": "single_episode_task_model_radar_chart",
 
829
  "surface": "website_hf",
830
  "shows": "Separates the selected 128-episode methods: raw-feature simple/NN as complete 20/20 scored polygons and metadata/Qwen/Cosmos as task-aligned overlays.",
831
  "exists": true,
832
+ "bytes": 48923,
833
+ "sha256": "75c389122a413548bdc26fd05cbbad2a85015ebd222ba1a23571f3ff4f0eddcf"
834
  },
835
  {
836
  "id": "unified_task_model_radar_builder",
 
840
  "surface": "repo_hf",
841
  "shows": "Regenerates the direction-aware radar chart and machine-readable metric overlay JSON.",
842
  "exists": true,
843
+ "bytes": 57104,
844
+ "sha256": "805cfce89529fec73edd3e436c1a76afae46cebe31ba5e441b6dfb5cc142c935"
845
  },
846
  {
847
  "id": "task_method_20_gap_audit_builder",
 
873
  "surface": "repo_hf",
874
  "shows": "Checks whether Qwen3/Cosmos branches have train, validation, and test prediction files before extending model overlays to all 20 task contracts.",
875
  "exists": true,
876
+ "bytes": 4977,
877
+ "sha256": "b9caf6d32bb801d845b57b4450b92c10a4c3f9d14890f6a209e5a52aede92568"
878
  },
879
  {
880
  "id": "model_output_probe_script",
 
895
  "surface": "repo_hf",
896
  "shows": "Scores task-specific Qwen3/Cosmos overlays only where verified held-out prediction JSON or compact target maps already contain the required targets.",
897
  "exists": true,
898
+ "bytes": 5951,
899
+ "sha256": "910477d2fba648605dda128d0ecd2a2c13cfa460573e350dc850014ac91c6c2b"
900
  },
901
  {
902
  "id": "existing_model_output_task_probe_script",
 
906
  "surface": "repo_hf",
907
  "shows": "Derives task-specific scores from committed verified model outputs without running new inference or backfilling absent targets.",
908
  "exists": true,
909
+ "bytes": 69411,
910
+ "sha256": "a78889e5225405fcbb0156aa8c63cbbe79022a12283d0b398c5f2bb015175fe7"
911
  },
912
  {
913
  "id": "a100_128_metadata_task_baselines",
 
1116
  "shows": "Machine-readable release-check summary for validators, mirrors, and public project surfaces.",
1117
  "exists": true,
1118
  "bytes": 8100,
1119
+ "sha256": "b88b46bd9b16d4afaf4836d0acff208b46559a493cfcffa881f1528fa282292c"
1120
  },
1121
  {
1122
  "id": "public_surface_qa",
 
1321
  "volatile": true,
1322
  "shows": "Confirms prepared GitHub/HF Space/artifact/model mirrors share the same critical data, figure, website HTML, and validator files.",
1323
  "exists": true,
1324
+ "bytes": 1015184,
1325
  "hash_policy": "existence_and_size_only"
1326
  },
1327
  {
data/episode128_task_model_radar.json CHANGED
@@ -1,12 +1,12 @@
1
  {
2
  "title": "128-Episode 20-Task Radar",
3
  "status": "pass",
4
- "generated_at_utc": "2026-06-18T22:25:59+00:00",
5
  "description": "Selected 128-episode metadata/raw baselines plus verified Qwen3/Cosmos branches. Every method has 20 records; numeric scores appear only where the public artifact produced that task target.",
6
  "task_count": 20,
7
  "method_count": 7,
8
  "method_task_record_count": 140,
9
- "scored_method_task_count": 111,
10
  "normalization_policy": {
11
  "higher_is_better": "bounded metrics are plotted directly on 0-1 axes after clipping to [0, 1]",
12
  "lower_is_better": "lower-error metrics are converted to best_observed_value / raw_value within the same task",
@@ -147,20 +147,20 @@
147
  "kind": "partial_128_episode_foundation_model_overlay",
148
  "scope": "128 selected episodes, held-out test",
149
  "stroke_dasharray": "4 7",
150
- "method_detail": "Verified Cosmos3-Super base-weight Reasoner JSON-task evaluation, plus task 16 and a derived task-20 action-boundary timing probe scored from existing verified JSON.",
151
  "plotted_as": "colored point overlay",
152
  "result_record_count": 20,
153
- "scored_task_count": 9,
154
- "covered_task_count": 9,
155
  "proxy_scored_task_count": 0,
156
- "scoreless_task_count": 11,
157
  "unsupported_task_count": 0,
158
- "not_evaluated_task_count": 11,
159
  "status_counts": {
160
- "not_evaluated_in_verified_package": 11,
161
- "scored": 9
162
  },
163
- "coverage_fraction": 0.45,
164
  "result_record_fraction": 1.0
165
  },
166
  {
@@ -171,20 +171,20 @@
171
  "kind": "partial_128_episode_world_model_overlay",
172
  "scope": "128 selected episodes, held-out test",
173
  "stroke_dasharray": "2 7",
174
- "method_detail": "Verified Cosmos3-Nano future-window compatibility metrics, plus tasks 10/13/14/17 and a derived task-20 boundary timing probe scored from existing held-out future-window artifacts.",
175
  "plotted_as": "colored point overlay",
176
  "result_record_count": 20,
177
- "scored_task_count": 10,
178
- "covered_task_count": 10,
179
  "proxy_scored_task_count": 0,
180
- "scoreless_task_count": 10,
181
  "unsupported_task_count": 0,
182
- "not_evaluated_task_count": 10,
183
  "status_counts": {
184
- "not_evaluated_in_verified_package": 10,
185
- "scored": 10
186
  },
187
- "coverage_fraction": 0.5,
188
  "result_record_fraction": 1.0
189
  }
190
  ],
@@ -894,15 +894,15 @@
894
  "status_label": "scored"
895
  },
896
  "cosmos3_super_reasoner": {
897
- "raw": null,
898
- "metric_key": "mrr",
899
- "source": null,
900
  "scope": "multi_episode_128_partial_model_overlay",
901
- "status": "not_evaluated_in_verified_package",
902
- "reason": "the verified public model package did not ask this branch to emit that task target; a new task-specific evaluation package is required for a numeric score",
903
- "normalized_score": null,
904
- "raw_text": "n/a",
905
- "status_label": "not evaluated"
906
  },
907
  "cosmos3_nano_future_window": {
908
  "raw": null,
@@ -1633,15 +1633,15 @@
1633
  "status_label": "scored"
1634
  },
1635
  "cosmos3_nano_future_window": {
1636
- "raw": null,
1637
- "metric_key": "macro_f1",
1638
- "source": null,
1639
  "scope": "multi_episode_128_partial_model_overlay",
1640
- "status": "not_evaluated_in_verified_package",
1641
- "reason": "the verified public model package did not ask this branch to emit that task target; a new task-specific evaluation package is required for a numeric score",
1642
- "normalized_score": null,
1643
- "raw_text": "n/a",
1644
- "status_label": "not evaluated"
1645
  }
1646
  }
1647
  },
@@ -2989,17 +2989,17 @@
2989
  "task_label": "Language Grounding",
2990
  "series_id": "cosmos3_super_reasoner",
2991
  "method": "Cosmos3-Super Reasoner",
2992
- "status": "not_evaluated_in_verified_package",
2993
- "status_label": "not evaluated",
2994
- "scored": false,
2995
  "proxy_scored": false,
2996
- "raw": null,
2997
- "raw_text": "n/a",
2998
- "normalized_score": null,
2999
- "metric_key": "mrr",
3000
- "source": null,
3001
  "scope": "multi_episode_128_partial_model_overlay",
3002
- "reason": "the verified public model package did not ask this branch to emit that task target; a new task-specific evaluation package is required for a numeric score"
3003
  },
3004
  {
3005
  "task_number": 8,
@@ -4015,17 +4015,17 @@
4015
  "task_label": "Action-Object Relation Prediction",
4016
  "series_id": "cosmos3_nano_future_window",
4017
  "method": "Cosmos3-Nano Future Window",
4018
- "status": "not_evaluated_in_verified_package",
4019
- "status_label": "not evaluated",
4020
- "scored": false,
4021
  "proxy_scored": false,
4022
- "raw": null,
4023
- "raw_text": "n/a",
4024
- "normalized_score": null,
4025
- "metric_key": "macro_f1",
4026
- "source": null,
4027
  "scope": "multi_episode_128_partial_model_overlay",
4028
- "reason": "the verified public model package did not ask this branch to emit that task target; a new task-specific evaluation package is required for a numeric score"
4029
  },
4030
  {
4031
  "task_number": 17,
 
1
  {
2
  "title": "128-Episode 20-Task Radar",
3
  "status": "pass",
4
+ "generated_at_utc": "2026-06-18T22:55:01+00:00",
5
  "description": "Selected 128-episode metadata/raw baselines plus verified Qwen3/Cosmos branches. Every method has 20 records; numeric scores appear only where the public artifact produced that task target.",
6
  "task_count": 20,
7
  "method_count": 7,
8
  "method_task_record_count": 140,
9
+ "scored_method_task_count": 113,
10
  "normalization_policy": {
11
  "higher_is_better": "bounded metrics are plotted directly on 0-1 axes after clipping to [0, 1]",
12
  "lower_is_better": "lower-error metrics are converted to best_observed_value / raw_value within the same task",
 
147
  "kind": "partial_128_episode_foundation_model_overlay",
148
  "scope": "128 selected episodes, held-out test",
149
  "stroke_dasharray": "4 7",
150
+ "method_detail": "Verified Cosmos3-Super base-weight Reasoner JSON-task evaluation, plus task 8/16 and a derived task-20 action-boundary timing probe scored from existing verified JSON.",
151
  "plotted_as": "colored point overlay",
152
  "result_record_count": 20,
153
+ "scored_task_count": 10,
154
+ "covered_task_count": 10,
155
  "proxy_scored_task_count": 0,
156
+ "scoreless_task_count": 10,
157
  "unsupported_task_count": 0,
158
+ "not_evaluated_task_count": 10,
159
  "status_counts": {
160
+ "not_evaluated_in_verified_package": 10,
161
+ "scored": 10
162
  },
163
+ "coverage_fraction": 0.5,
164
  "result_record_fraction": 1.0
165
  },
166
  {
 
171
  "kind": "partial_128_episode_world_model_overlay",
172
  "scope": "128 selected episodes, held-out test",
173
  "stroke_dasharray": "2 7",
174
+ "method_detail": "Verified Cosmos3-Nano future-window compatibility metrics, plus tasks 10/13/14/16/17 and a derived task-20 boundary timing probe scored from existing held-out future-window artifacts.",
175
  "plotted_as": "colored point overlay",
176
  "result_record_count": 20,
177
+ "scored_task_count": 11,
178
+ "covered_task_count": 11,
179
  "proxy_scored_task_count": 0,
180
+ "scoreless_task_count": 9,
181
  "unsupported_task_count": 0,
182
+ "not_evaluated_task_count": 9,
183
  "status_counts": {
184
+ "not_evaluated_in_verified_package": 9,
185
+ "scored": 11
186
  },
187
+ "coverage_fraction": 0.55,
188
  "result_record_fraction": 1.0
189
  }
190
  ],
 
894
  "status_label": "scored"
895
  },
896
  "cosmos3_super_reasoner": {
897
+ "raw": 0.30639899644580487,
898
+ "metric_key": "caption_grounding_iou",
899
+ "source": "results/omni_finetune/model_output_task_probes_20260616/caption_grounding/cosmos3_super_reasoner/metrics.json",
900
  "scope": "multi_episode_128_partial_model_overlay",
901
+ "status": "scored",
902
+ "reason": null,
903
+ "normalized_score": 0.30639899644580487,
904
+ "raw_text": "0.3064",
905
+ "status_label": "scored"
906
  },
907
  "cosmos3_nano_future_window": {
908
  "raw": null,
 
1633
  "status_label": "scored"
1634
  },
1635
  "cosmos3_nano_future_window": {
1636
+ "raw": 0.002794157670325683,
1637
+ "metric_key": "action_object_relation_macro_f1",
1638
+ "source": "results/omni_finetune/model_output_task_probes_20260616/action_object_relation/cosmos3_nano_future_window/metrics.json",
1639
  "scope": "multi_episode_128_partial_model_overlay",
1640
+ "status": "scored",
1641
+ "reason": null,
1642
+ "normalized_score": 0.002794157670325683,
1643
+ "raw_text": "0.0028",
1644
+ "status_label": "scored"
1645
  }
1646
  }
1647
  },
 
2989
  "task_label": "Language Grounding",
2990
  "series_id": "cosmos3_super_reasoner",
2991
  "method": "Cosmos3-Super Reasoner",
2992
+ "status": "scored",
2993
+ "status_label": "scored",
2994
+ "scored": true,
2995
  "proxy_scored": false,
2996
+ "raw": 0.30639899644580487,
2997
+ "raw_text": "0.3064",
2998
+ "normalized_score": 0.30639899644580487,
2999
+ "metric_key": "caption_grounding_iou",
3000
+ "source": "results/omni_finetune/model_output_task_probes_20260616/caption_grounding/cosmos3_super_reasoner/metrics.json",
3001
  "scope": "multi_episode_128_partial_model_overlay",
3002
+ "reason": null
3003
  },
3004
  {
3005
  "task_number": 8,
 
4015
  "task_label": "Action-Object Relation Prediction",
4016
  "series_id": "cosmos3_nano_future_window",
4017
  "method": "Cosmos3-Nano Future Window",
4018
+ "status": "scored",
4019
+ "status_label": "scored",
4020
+ "scored": true,
4021
  "proxy_scored": false,
4022
+ "raw": 0.002794157670325683,
4023
+ "raw_text": "0.0028",
4024
+ "normalized_score": 0.002794157670325683,
4025
+ "metric_key": "action_object_relation_macro_f1",
4026
+ "source": "results/omni_finetune/model_output_task_probes_20260616/action_object_relation/cosmos3_nano_future_window/metrics.json",
4027
  "scope": "multi_episode_128_partial_model_overlay",
4028
+ "reason": null
4029
  },
4030
  {
4031
  "task_number": 17,
data/mirror_parity.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "status": "pass",
3
- "generated_at_utc": "2026-06-18T22:36:57+00:00",
4
  "hf_root": "hf_publish",
5
  "summary": {
6
- "group_count": 855,
7
  "failure_count": 0,
8
  "failures_by_surface": {}
9
  },
@@ -138,45 +138,45 @@
138
  "local": {
139
  "path": "repo:docs/data/artifact_index.json",
140
  "exists": true,
141
- "bytes": 116643,
142
- "sha256": "52e9ef2ca8b7bdcb1ab53f5bbed55a1a1e846eb7c4dbf13eaf25b210f581e2bd"
143
  },
144
  "mirrors": {
145
  "hf_space": {
146
  "path": "hf_space:data/artifact_index.json",
147
  "exists": true,
148
- "bytes": 116643,
149
- "sha256": "52e9ef2ca8b7bdcb1ab53f5bbed55a1a1e846eb7c4dbf13eaf25b210f581e2bd"
150
  },
151
  "hf_artifacts_data": {
152
  "path": "hf_artifacts:data/artifact_index.json",
153
  "exists": true,
154
- "bytes": 116643,
155
- "sha256": "52e9ef2ca8b7bdcb1ab53f5bbed55a1a1e846eb7c4dbf13eaf25b210f581e2bd"
156
  },
157
  "hf_artifacts": {
158
  "path": "hf_artifacts:docs/data/artifact_index.json",
159
  "exists": true,
160
- "bytes": 116643,
161
- "sha256": "52e9ef2ca8b7bdcb1ab53f5bbed55a1a1e846eb7c4dbf13eaf25b210f581e2bd"
162
  },
163
  "hf_model_data": {
164
  "path": "hf_model:data/artifact_index.json",
165
  "exists": true,
166
- "bytes": 116643,
167
- "sha256": "52e9ef2ca8b7bdcb1ab53f5bbed55a1a1e846eb7c4dbf13eaf25b210f581e2bd"
168
  },
169
  "hf_model_docs_data": {
170
  "path": "hf_model:docs/data/artifact_index.json",
171
  "exists": true,
172
- "bytes": 116643,
173
- "sha256": "52e9ef2ca8b7bdcb1ab53f5bbed55a1a1e846eb7c4dbf13eaf25b210f581e2bd"
174
  },
175
  "hf_model": {
176
  "path": "hf_model:metrics/artifact_index.json",
177
  "exists": true,
178
- "bytes": 116643,
179
- "sha256": "52e9ef2ca8b7bdcb1ab53f5bbed55a1a1e846eb7c4dbf13eaf25b210f581e2bd"
180
  }
181
  },
182
  "failures": []
@@ -922,45 +922,45 @@
922
  "local": {
923
  "path": "repo:docs/data/publication_audit.json",
924
  "exists": true,
925
- "bytes": 9613,
926
- "sha256": "1f9344871b3783f39e6ed709d892cf0e60c2b2d29fcd635f711672625a3404b1"
927
  },
928
  "mirrors": {
929
  "hf_space": {
930
  "path": "hf_space:data/publication_audit.json",
931
  "exists": true,
932
- "bytes": 9613,
933
- "sha256": "1f9344871b3783f39e6ed709d892cf0e60c2b2d29fcd635f711672625a3404b1"
934
  },
935
  "hf_artifacts_data": {
936
  "path": "hf_artifacts:data/publication_audit.json",
937
  "exists": true,
938
- "bytes": 9613,
939
- "sha256": "1f9344871b3783f39e6ed709d892cf0e60c2b2d29fcd635f711672625a3404b1"
940
  },
941
  "hf_artifacts": {
942
  "path": "hf_artifacts:docs/data/publication_audit.json",
943
  "exists": true,
944
- "bytes": 9613,
945
- "sha256": "1f9344871b3783f39e6ed709d892cf0e60c2b2d29fcd635f711672625a3404b1"
946
  },
947
  "hf_model_data": {
948
  "path": "hf_model:data/publication_audit.json",
949
  "exists": true,
950
- "bytes": 9613,
951
- "sha256": "1f9344871b3783f39e6ed709d892cf0e60c2b2d29fcd635f711672625a3404b1"
952
  },
953
  "hf_model_docs_data": {
954
  "path": "hf_model:docs/data/publication_audit.json",
955
  "exists": true,
956
- "bytes": 9613,
957
- "sha256": "1f9344871b3783f39e6ed709d892cf0e60c2b2d29fcd635f711672625a3404b1"
958
  },
959
  "hf_model": {
960
  "path": "hf_model:metrics/publication_audit.json",
961
  "exists": true,
962
- "bytes": 9613,
963
- "sha256": "1f9344871b3783f39e6ed709d892cf0e60c2b2d29fcd635f711672625a3404b1"
964
  }
965
  },
966
  "failures": []
@@ -972,44 +972,44 @@
972
  "path": "repo:docs/data/public_surface_qa.json",
973
  "exists": true,
974
  "bytes": 7126,
975
- "sha256": "1f57b699b7ad919698e69b8cdef576cd525878468c6d8e86621431eb15402c5e"
976
  },
977
  "mirrors": {
978
  "hf_space": {
979
  "path": "hf_space:data/public_surface_qa.json",
980
  "exists": true,
981
  "bytes": 7126,
982
- "sha256": "1f57b699b7ad919698e69b8cdef576cd525878468c6d8e86621431eb15402c5e"
983
  },
984
  "hf_artifacts_data": {
985
  "path": "hf_artifacts:data/public_surface_qa.json",
986
  "exists": true,
987
  "bytes": 7126,
988
- "sha256": "1f57b699b7ad919698e69b8cdef576cd525878468c6d8e86621431eb15402c5e"
989
  },
990
  "hf_artifacts": {
991
  "path": "hf_artifacts:docs/data/public_surface_qa.json",
992
  "exists": true,
993
  "bytes": 7126,
994
- "sha256": "1f57b699b7ad919698e69b8cdef576cd525878468c6d8e86621431eb15402c5e"
995
  },
996
  "hf_model_data": {
997
  "path": "hf_model:data/public_surface_qa.json",
998
  "exists": true,
999
  "bytes": 7126,
1000
- "sha256": "1f57b699b7ad919698e69b8cdef576cd525878468c6d8e86621431eb15402c5e"
1001
  },
1002
  "hf_model_docs_data": {
1003
  "path": "hf_model:docs/data/public_surface_qa.json",
1004
  "exists": true,
1005
  "bytes": 7126,
1006
- "sha256": "1f57b699b7ad919698e69b8cdef576cd525878468c6d8e86621431eb15402c5e"
1007
  },
1008
  "hf_model": {
1009
  "path": "hf_model:metrics/public_surface_qa.json",
1010
  "exists": true,
1011
  "bytes": 7126,
1012
- "sha256": "1f57b699b7ad919698e69b8cdef576cd525878468c6d8e86621431eb15402c5e"
1013
  }
1014
  },
1015
  "failures": []
@@ -1119,44 +1119,44 @@
1119
  "path": "repo:docs/data/quality_gates.json",
1120
  "exists": true,
1121
  "bytes": 8100,
1122
- "sha256": "16a1241e753b46169ee937ed28b00dc63a41509c6d127a9068aabd831e9e40cc"
1123
  },
1124
  "mirrors": {
1125
  "hf_space": {
1126
  "path": "hf_space:data/quality_gates.json",
1127
  "exists": true,
1128
  "bytes": 8100,
1129
- "sha256": "16a1241e753b46169ee937ed28b00dc63a41509c6d127a9068aabd831e9e40cc"
1130
  },
1131
  "hf_artifacts_data": {
1132
  "path": "hf_artifacts:data/quality_gates.json",
1133
  "exists": true,
1134
  "bytes": 8100,
1135
- "sha256": "16a1241e753b46169ee937ed28b00dc63a41509c6d127a9068aabd831e9e40cc"
1136
  },
1137
  "hf_artifacts": {
1138
  "path": "hf_artifacts:docs/data/quality_gates.json",
1139
  "exists": true,
1140
  "bytes": 8100,
1141
- "sha256": "16a1241e753b46169ee937ed28b00dc63a41509c6d127a9068aabd831e9e40cc"
1142
  },
1143
  "hf_model_data": {
1144
  "path": "hf_model:data/quality_gates.json",
1145
  "exists": true,
1146
  "bytes": 8100,
1147
- "sha256": "16a1241e753b46169ee937ed28b00dc63a41509c6d127a9068aabd831e9e40cc"
1148
  },
1149
  "hf_model_docs_data": {
1150
  "path": "hf_model:docs/data/quality_gates.json",
1151
  "exists": true,
1152
  "bytes": 8100,
1153
- "sha256": "16a1241e753b46169ee937ed28b00dc63a41509c6d127a9068aabd831e9e40cc"
1154
  },
1155
  "hf_model": {
1156
  "path": "hf_model:metrics/quality_gates.json",
1157
  "exists": true,
1158
  "bytes": 8100,
1159
- "sha256": "16a1241e753b46169ee937ed28b00dc63a41509c6d127a9068aabd831e9e40cc"
1160
  }
1161
  },
1162
  "failures": []
@@ -1560,44 +1560,44 @@
1560
  "path": "repo:docs/data/scope_claims_audit.json",
1561
  "exists": true,
1562
  "bytes": 21630,
1563
- "sha256": "2fef6d1cee15981aec3aa4af933c767997e01500a0fd6141f61d144223e24ad3"
1564
  },
1565
  "mirrors": {
1566
  "hf_space": {
1567
  "path": "hf_space:data/scope_claims_audit.json",
1568
  "exists": true,
1569
  "bytes": 21630,
1570
- "sha256": "2fef6d1cee15981aec3aa4af933c767997e01500a0fd6141f61d144223e24ad3"
1571
  },
1572
  "hf_artifacts_data": {
1573
  "path": "hf_artifacts:data/scope_claims_audit.json",
1574
  "exists": true,
1575
  "bytes": 21630,
1576
- "sha256": "2fef6d1cee15981aec3aa4af933c767997e01500a0fd6141f61d144223e24ad3"
1577
  },
1578
  "hf_artifacts": {
1579
  "path": "hf_artifacts:docs/data/scope_claims_audit.json",
1580
  "exists": true,
1581
  "bytes": 21630,
1582
- "sha256": "2fef6d1cee15981aec3aa4af933c767997e01500a0fd6141f61d144223e24ad3"
1583
  },
1584
  "hf_model_data": {
1585
  "path": "hf_model:data/scope_claims_audit.json",
1586
  "exists": true,
1587
  "bytes": 21630,
1588
- "sha256": "2fef6d1cee15981aec3aa4af933c767997e01500a0fd6141f61d144223e24ad3"
1589
  },
1590
  "hf_model_docs_data": {
1591
  "path": "hf_model:docs/data/scope_claims_audit.json",
1592
  "exists": true,
1593
  "bytes": 21630,
1594
- "sha256": "2fef6d1cee15981aec3aa4af933c767997e01500a0fd6141f61d144223e24ad3"
1595
  },
1596
  "hf_model": {
1597
  "path": "hf_model:metrics/scope_claims_audit.json",
1598
  "exists": true,
1599
  "bytes": 21630,
1600
- "sha256": "2fef6d1cee15981aec3aa4af933c767997e01500a0fd6141f61d144223e24ad3"
1601
  }
1602
  },
1603
  "failures": []
@@ -1658,44 +1658,44 @@
1658
  "path": "repo:docs/data/source_alignment_audit.json",
1659
  "exists": true,
1660
  "bytes": 4432,
1661
- "sha256": "1df30908392b455cc7263154126d55709cf97c60ff4213f0eee9ce17d92fb234"
1662
  },
1663
  "mirrors": {
1664
  "hf_space": {
1665
  "path": "hf_space:data/source_alignment_audit.json",
1666
  "exists": true,
1667
  "bytes": 4432,
1668
- "sha256": "1df30908392b455cc7263154126d55709cf97c60ff4213f0eee9ce17d92fb234"
1669
  },
1670
  "hf_artifacts_data": {
1671
  "path": "hf_artifacts:data/source_alignment_audit.json",
1672
  "exists": true,
1673
  "bytes": 4432,
1674
- "sha256": "1df30908392b455cc7263154126d55709cf97c60ff4213f0eee9ce17d92fb234"
1675
  },
1676
  "hf_artifacts": {
1677
  "path": "hf_artifacts:docs/data/source_alignment_audit.json",
1678
  "exists": true,
1679
  "bytes": 4432,
1680
- "sha256": "1df30908392b455cc7263154126d55709cf97c60ff4213f0eee9ce17d92fb234"
1681
  },
1682
  "hf_model_data": {
1683
  "path": "hf_model:data/source_alignment_audit.json",
1684
  "exists": true,
1685
  "bytes": 4432,
1686
- "sha256": "1df30908392b455cc7263154126d55709cf97c60ff4213f0eee9ce17d92fb234"
1687
  },
1688
  "hf_model_docs_data": {
1689
  "path": "hf_model:docs/data/source_alignment_audit.json",
1690
  "exists": true,
1691
  "bytes": 4432,
1692
- "sha256": "1df30908392b455cc7263154126d55709cf97c60ff4213f0eee9ce17d92fb234"
1693
  },
1694
  "hf_model": {
1695
  "path": "hf_model:metrics/source_alignment_audit.json",
1696
  "exists": true,
1697
  "bytes": 4432,
1698
- "sha256": "1df30908392b455cc7263154126d55709cf97c60ff4213f0eee9ce17d92fb234"
1699
  }
1700
  },
1701
  "failures": []
@@ -1756,44 +1756,44 @@
1756
  "path": "repo:docs/data/single_episode_task_model_radar.json",
1757
  "exists": true,
1758
  "bytes": 51064,
1759
- "sha256": "6a78822649c3318371bd1943bc4aceb6216052d832b682a98d4f887dab9c2756"
1760
  },
1761
  "mirrors": {
1762
  "hf_space": {
1763
  "path": "hf_space:data/single_episode_task_model_radar.json",
1764
  "exists": true,
1765
  "bytes": 51064,
1766
- "sha256": "6a78822649c3318371bd1943bc4aceb6216052d832b682a98d4f887dab9c2756"
1767
  },
1768
  "hf_artifacts_data": {
1769
  "path": "hf_artifacts:data/single_episode_task_model_radar.json",
1770
  "exists": true,
1771
  "bytes": 51064,
1772
- "sha256": "6a78822649c3318371bd1943bc4aceb6216052d832b682a98d4f887dab9c2756"
1773
  },
1774
  "hf_artifacts": {
1775
  "path": "hf_artifacts:docs/data/single_episode_task_model_radar.json",
1776
  "exists": true,
1777
  "bytes": 51064,
1778
- "sha256": "6a78822649c3318371bd1943bc4aceb6216052d832b682a98d4f887dab9c2756"
1779
  },
1780
  "hf_model_data": {
1781
  "path": "hf_model:data/single_episode_task_model_radar.json",
1782
  "exists": true,
1783
  "bytes": 51064,
1784
- "sha256": "6a78822649c3318371bd1943bc4aceb6216052d832b682a98d4f887dab9c2756"
1785
  },
1786
  "hf_model_docs_data": {
1787
  "path": "hf_model:docs/data/single_episode_task_model_radar.json",
1788
  "exists": true,
1789
  "bytes": 51064,
1790
- "sha256": "6a78822649c3318371bd1943bc4aceb6216052d832b682a98d4f887dab9c2756"
1791
  },
1792
  "hf_model": {
1793
  "path": "hf_model:metrics/single_episode_task_model_radar.json",
1794
  "exists": true,
1795
  "bytes": 51064,
1796
- "sha256": "6a78822649c3318371bd1943bc4aceb6216052d832b682a98d4f887dab9c2756"
1797
  }
1798
  },
1799
  "failures": []
@@ -1804,45 +1804,45 @@
1804
  "local": {
1805
  "path": "repo:docs/data/episode128_task_model_radar.json",
1806
  "exists": true,
1807
- "bytes": 185391,
1808
- "sha256": "53fbfad3e38a6accae25bb345f4682e39ebab69948df5a3423096eb7ed68b5d7"
1809
  },
1810
  "mirrors": {
1811
  "hf_space": {
1812
  "path": "hf_space:data/episode128_task_model_radar.json",
1813
  "exists": true,
1814
- "bytes": 185391,
1815
- "sha256": "53fbfad3e38a6accae25bb345f4682e39ebab69948df5a3423096eb7ed68b5d7"
1816
  },
1817
  "hf_artifacts_data": {
1818
  "path": "hf_artifacts:data/episode128_task_model_radar.json",
1819
  "exists": true,
1820
- "bytes": 185391,
1821
- "sha256": "53fbfad3e38a6accae25bb345f4682e39ebab69948df5a3423096eb7ed68b5d7"
1822
  },
1823
  "hf_artifacts": {
1824
  "path": "hf_artifacts:docs/data/episode128_task_model_radar.json",
1825
  "exists": true,
1826
- "bytes": 185391,
1827
- "sha256": "53fbfad3e38a6accae25bb345f4682e39ebab69948df5a3423096eb7ed68b5d7"
1828
  },
1829
  "hf_model_data": {
1830
  "path": "hf_model:data/episode128_task_model_radar.json",
1831
  "exists": true,
1832
- "bytes": 185391,
1833
- "sha256": "53fbfad3e38a6accae25bb345f4682e39ebab69948df5a3423096eb7ed68b5d7"
1834
  },
1835
  "hf_model_docs_data": {
1836
  "path": "hf_model:docs/data/episode128_task_model_radar.json",
1837
  "exists": true,
1838
- "bytes": 185391,
1839
- "sha256": "53fbfad3e38a6accae25bb345f4682e39ebab69948df5a3423096eb7ed68b5d7"
1840
  },
1841
  "hf_model": {
1842
  "path": "hf_model:metrics/episode128_task_model_radar.json",
1843
  "exists": true,
1844
- "bytes": 185391,
1845
- "sha256": "53fbfad3e38a6accae25bb345f4682e39ebab69948df5a3423096eb7ed68b5d7"
1846
  }
1847
  },
1848
  "failures": []
@@ -2001,44 +2001,44 @@
2001
  "path": "repo:docs/data/task_surface_integrity.json",
2002
  "exists": true,
2003
  "bytes": 45779,
2004
- "sha256": "4c0b7c81b916d32d7b2d8453c5b3e8dbf5e19d0e4002c966b9d4a34f33e49f0d"
2005
  },
2006
  "mirrors": {
2007
  "hf_space": {
2008
  "path": "hf_space:data/task_surface_integrity.json",
2009
  "exists": true,
2010
  "bytes": 45779,
2011
- "sha256": "4c0b7c81b916d32d7b2d8453c5b3e8dbf5e19d0e4002c966b9d4a34f33e49f0d"
2012
  },
2013
  "hf_artifacts_data": {
2014
  "path": "hf_artifacts:data/task_surface_integrity.json",
2015
  "exists": true,
2016
  "bytes": 45779,
2017
- "sha256": "4c0b7c81b916d32d7b2d8453c5b3e8dbf5e19d0e4002c966b9d4a34f33e49f0d"
2018
  },
2019
  "hf_artifacts": {
2020
  "path": "hf_artifacts:docs/data/task_surface_integrity.json",
2021
  "exists": true,
2022
  "bytes": 45779,
2023
- "sha256": "4c0b7c81b916d32d7b2d8453c5b3e8dbf5e19d0e4002c966b9d4a34f33e49f0d"
2024
  },
2025
  "hf_model_data": {
2026
  "path": "hf_model:data/task_surface_integrity.json",
2027
  "exists": true,
2028
  "bytes": 45779,
2029
- "sha256": "4c0b7c81b916d32d7b2d8453c5b3e8dbf5e19d0e4002c966b9d4a34f33e49f0d"
2030
  },
2031
  "hf_model_docs_data": {
2032
  "path": "hf_model:docs/data/task_surface_integrity.json",
2033
  "exists": true,
2034
  "bytes": 45779,
2035
- "sha256": "4c0b7c81b916d32d7b2d8453c5b3e8dbf5e19d0e4002c966b9d4a34f33e49f0d"
2036
  },
2037
  "hf_model": {
2038
  "path": "hf_model:metrics/task_surface_integrity.json",
2039
  "exists": true,
2040
  "bytes": 45779,
2041
- "sha256": "4c0b7c81b916d32d7b2d8453c5b3e8dbf5e19d0e4002c966b9d4a34f33e49f0d"
2042
  }
2043
  },
2044
  "failures": []
@@ -2098,45 +2098,45 @@
2098
  "local": {
2099
  "path": "repo:docs/data/task_method_20_result_matrix.json",
2100
  "exists": true,
2101
- "bytes": 128842,
2102
- "sha256": "a361c2528ccbbd6b1b53ede78e6d39353aa98630bcfed7b8014b77b05c4f226b"
2103
  },
2104
  "mirrors": {
2105
  "hf_space": {
2106
  "path": "hf_space:data/task_method_20_result_matrix.json",
2107
  "exists": true,
2108
- "bytes": 128842,
2109
- "sha256": "a361c2528ccbbd6b1b53ede78e6d39353aa98630bcfed7b8014b77b05c4f226b"
2110
  },
2111
  "hf_artifacts_data": {
2112
  "path": "hf_artifacts:data/task_method_20_result_matrix.json",
2113
  "exists": true,
2114
- "bytes": 128842,
2115
- "sha256": "a361c2528ccbbd6b1b53ede78e6d39353aa98630bcfed7b8014b77b05c4f226b"
2116
  },
2117
  "hf_artifacts": {
2118
  "path": "hf_artifacts:docs/data/task_method_20_result_matrix.json",
2119
  "exists": true,
2120
- "bytes": 128842,
2121
- "sha256": "a361c2528ccbbd6b1b53ede78e6d39353aa98630bcfed7b8014b77b05c4f226b"
2122
  },
2123
  "hf_model_data": {
2124
  "path": "hf_model:data/task_method_20_result_matrix.json",
2125
  "exists": true,
2126
- "bytes": 128842,
2127
- "sha256": "a361c2528ccbbd6b1b53ede78e6d39353aa98630bcfed7b8014b77b05c4f226b"
2128
  },
2129
  "hf_model_docs_data": {
2130
  "path": "hf_model:docs/data/task_method_20_result_matrix.json",
2131
  "exists": true,
2132
- "bytes": 128842,
2133
- "sha256": "a361c2528ccbbd6b1b53ede78e6d39353aa98630bcfed7b8014b77b05c4f226b"
2134
  },
2135
  "hf_model": {
2136
  "path": "hf_model:metrics/task_method_20_result_matrix.json",
2137
  "exists": true,
2138
- "bytes": 128842,
2139
- "sha256": "a361c2528ccbbd6b1b53ede78e6d39353aa98630bcfed7b8014b77b05c4f226b"
2140
  }
2141
  },
2142
  "failures": []
@@ -2147,45 +2147,45 @@
2147
  "local": {
2148
  "path": "repo:docs/data/task_method_20_gap_audit.json",
2149
  "exists": true,
2150
- "bytes": 29788,
2151
- "sha256": "143e03828559e706ab083b3824731d652bcb5a915cfb441caa4a3e6447a982f2"
2152
  },
2153
  "mirrors": {
2154
  "hf_space": {
2155
  "path": "hf_space:data/task_method_20_gap_audit.json",
2156
  "exists": true,
2157
- "bytes": 29788,
2158
- "sha256": "143e03828559e706ab083b3824731d652bcb5a915cfb441caa4a3e6447a982f2"
2159
  },
2160
  "hf_artifacts_data": {
2161
  "path": "hf_artifacts:data/task_method_20_gap_audit.json",
2162
  "exists": true,
2163
- "bytes": 29788,
2164
- "sha256": "143e03828559e706ab083b3824731d652bcb5a915cfb441caa4a3e6447a982f2"
2165
  },
2166
  "hf_artifacts": {
2167
  "path": "hf_artifacts:docs/data/task_method_20_gap_audit.json",
2168
  "exists": true,
2169
- "bytes": 29788,
2170
- "sha256": "143e03828559e706ab083b3824731d652bcb5a915cfb441caa4a3e6447a982f2"
2171
  },
2172
  "hf_model_data": {
2173
  "path": "hf_model:data/task_method_20_gap_audit.json",
2174
  "exists": true,
2175
- "bytes": 29788,
2176
- "sha256": "143e03828559e706ab083b3824731d652bcb5a915cfb441caa4a3e6447a982f2"
2177
  },
2178
  "hf_model_docs_data": {
2179
  "path": "hf_model:docs/data/task_method_20_gap_audit.json",
2180
  "exists": true,
2181
- "bytes": 29788,
2182
- "sha256": "143e03828559e706ab083b3824731d652bcb5a915cfb441caa4a3e6447a982f2"
2183
  },
2184
  "hf_model": {
2185
  "path": "hf_model:metrics/task_method_20_gap_audit.json",
2186
  "exists": true,
2187
- "bytes": 29788,
2188
- "sha256": "143e03828559e706ab083b3824731d652bcb5a915cfb441caa4a3e6447a982f2"
2189
  }
2190
  },
2191
  "failures": []
@@ -2245,45 +2245,45 @@
2245
  "local": {
2246
  "path": "repo:docs/data/unified_task_model_radar.json",
2247
  "exists": true,
2248
- "bytes": 229244,
2249
- "sha256": "6e9de603b3f2ca60ee099135e9df559781f7481a87f6cdc7ec8873b798e14990"
2250
  },
2251
  "mirrors": {
2252
  "hf_space": {
2253
  "path": "hf_space:data/unified_task_model_radar.json",
2254
  "exists": true,
2255
- "bytes": 229244,
2256
- "sha256": "6e9de603b3f2ca60ee099135e9df559781f7481a87f6cdc7ec8873b798e14990"
2257
  },
2258
  "hf_artifacts_data": {
2259
  "path": "hf_artifacts:data/unified_task_model_radar.json",
2260
  "exists": true,
2261
- "bytes": 229244,
2262
- "sha256": "6e9de603b3f2ca60ee099135e9df559781f7481a87f6cdc7ec8873b798e14990"
2263
  },
2264
  "hf_artifacts": {
2265
  "path": "hf_artifacts:docs/data/unified_task_model_radar.json",
2266
  "exists": true,
2267
- "bytes": 229244,
2268
- "sha256": "6e9de603b3f2ca60ee099135e9df559781f7481a87f6cdc7ec8873b798e14990"
2269
  },
2270
  "hf_model_data": {
2271
  "path": "hf_model:data/unified_task_model_radar.json",
2272
  "exists": true,
2273
- "bytes": 229244,
2274
- "sha256": "6e9de603b3f2ca60ee099135e9df559781f7481a87f6cdc7ec8873b798e14990"
2275
  },
2276
  "hf_model_docs_data": {
2277
  "path": "hf_model:docs/data/unified_task_model_radar.json",
2278
  "exists": true,
2279
- "bytes": 229244,
2280
- "sha256": "6e9de603b3f2ca60ee099135e9df559781f7481a87f6cdc7ec8873b798e14990"
2281
  },
2282
  "hf_model": {
2283
  "path": "hf_model:metrics/unified_task_model_radar.json",
2284
  "exists": true,
2285
- "bytes": 229244,
2286
- "sha256": "6e9de603b3f2ca60ee099135e9df559781f7481a87f6cdc7ec8873b798e14990"
2287
  }
2288
  },
2289
  "failures": []
@@ -2294,45 +2294,45 @@
2294
  "local": {
2295
  "path": "repo:docs/data/website_integrity.json",
2296
  "exists": true,
2297
- "bytes": 20021,
2298
- "sha256": "f9b0ce37c945cd95d809eb447ac950464ec6e450411ecd816618a79f83581bbd"
2299
  },
2300
  "mirrors": {
2301
  "hf_space": {
2302
  "path": "hf_space:data/website_integrity.json",
2303
  "exists": true,
2304
- "bytes": 20021,
2305
- "sha256": "f9b0ce37c945cd95d809eb447ac950464ec6e450411ecd816618a79f83581bbd"
2306
  },
2307
  "hf_artifacts_data": {
2308
  "path": "hf_artifacts:data/website_integrity.json",
2309
  "exists": true,
2310
- "bytes": 20021,
2311
- "sha256": "f9b0ce37c945cd95d809eb447ac950464ec6e450411ecd816618a79f83581bbd"
2312
  },
2313
  "hf_artifacts": {
2314
  "path": "hf_artifacts:docs/data/website_integrity.json",
2315
  "exists": true,
2316
- "bytes": 20021,
2317
- "sha256": "f9b0ce37c945cd95d809eb447ac950464ec6e450411ecd816618a79f83581bbd"
2318
  },
2319
  "hf_model_data": {
2320
  "path": "hf_model:data/website_integrity.json",
2321
  "exists": true,
2322
- "bytes": 20021,
2323
- "sha256": "f9b0ce37c945cd95d809eb447ac950464ec6e450411ecd816618a79f83581bbd"
2324
  },
2325
  "hf_model_docs_data": {
2326
  "path": "hf_model:docs/data/website_integrity.json",
2327
  "exists": true,
2328
- "bytes": 20021,
2329
- "sha256": "f9b0ce37c945cd95d809eb447ac950464ec6e450411ecd816618a79f83581bbd"
2330
  },
2331
  "hf_model": {
2332
  "path": "hf_model:metrics/website_integrity.json",
2333
  "exists": true,
2334
- "bytes": 20021,
2335
- "sha256": "f9b0ce37c945cd95d809eb447ac950464ec6e450411ecd816618a79f83581bbd"
2336
  }
2337
  },
2338
  "failures": []
@@ -2515,33 +2515,33 @@
2515
  "local": {
2516
  "path": "repo:docs/assets/charts/episode128_task_model_radar.svg",
2517
  "exists": true,
2518
- "bytes": 48704,
2519
- "sha256": "45f8a79dc764ddbf0182ab7994fbfa5002b52b075951ab42831ecbfb3fd0405c"
2520
  },
2521
  "mirrors": {
2522
  "hf_space": {
2523
  "path": "hf_space:assets/charts/episode128_task_model_radar.svg",
2524
  "exists": true,
2525
- "bytes": 48704,
2526
- "sha256": "45f8a79dc764ddbf0182ab7994fbfa5002b52b075951ab42831ecbfb3fd0405c"
2527
  },
2528
  "hf_artifacts_docs": {
2529
  "path": "hf_artifacts:docs/assets/charts/episode128_task_model_radar.svg",
2530
  "exists": true,
2531
- "bytes": 48704,
2532
- "sha256": "45f8a79dc764ddbf0182ab7994fbfa5002b52b075951ab42831ecbfb3fd0405c"
2533
  },
2534
  "hf_artifacts_card": {
2535
  "path": "hf_artifacts:assets/charts/episode128_task_model_radar.svg",
2536
  "exists": true,
2537
- "bytes": 48704,
2538
- "sha256": "45f8a79dc764ddbf0182ab7994fbfa5002b52b075951ab42831ecbfb3fd0405c"
2539
  },
2540
  "hf_model": {
2541
  "path": "hf_model:assets/charts/episode128_task_model_radar.svg",
2542
  "exists": true,
2543
- "bytes": 48704,
2544
- "sha256": "45f8a79dc764ddbf0182ab7994fbfa5002b52b075951ab42831ecbfb3fd0405c"
2545
  }
2546
  },
2547
  "failures": []
@@ -2589,33 +2589,33 @@
2589
  "local": {
2590
  "path": "repo:docs/assets/charts/unified_task_model_radar.svg",
2591
  "exists": true,
2592
- "bytes": 54717,
2593
- "sha256": "8fb6de7004e8463c28d6ada669c475d19986a1a3689778c691717cff39a7531a"
2594
  },
2595
  "mirrors": {
2596
  "hf_space": {
2597
  "path": "hf_space:assets/charts/unified_task_model_radar.svg",
2598
  "exists": true,
2599
- "bytes": 54717,
2600
- "sha256": "8fb6de7004e8463c28d6ada669c475d19986a1a3689778c691717cff39a7531a"
2601
  },
2602
  "hf_artifacts_docs": {
2603
  "path": "hf_artifacts:docs/assets/charts/unified_task_model_radar.svg",
2604
  "exists": true,
2605
- "bytes": 54717,
2606
- "sha256": "8fb6de7004e8463c28d6ada669c475d19986a1a3689778c691717cff39a7531a"
2607
  },
2608
  "hf_artifacts_card": {
2609
  "path": "hf_artifacts:assets/charts/unified_task_model_radar.svg",
2610
  "exists": true,
2611
- "bytes": 54717,
2612
- "sha256": "8fb6de7004e8463c28d6ada669c475d19986a1a3689778c691717cff39a7531a"
2613
  },
2614
  "hf_model": {
2615
  "path": "hf_model:assets/charts/unified_task_model_radar.svg",
2616
  "exists": true,
2617
- "bytes": 54717,
2618
- "sha256": "8fb6de7004e8463c28d6ada669c475d19986a1a3689778c691717cff39a7531a"
2619
  }
2620
  },
2621
  "failures": []
@@ -4509,21 +4509,21 @@
4509
  "local": {
4510
  "path": "repo:scripts/omni/score_existing_model_output_task_probes.py",
4511
  "exists": true,
4512
- "bytes": 57470,
4513
- "sha256": "9a0708885c1a22addc0bec199488021e277c7a7b7e23d6a37344fbbb3e5f1b96"
4514
  },
4515
  "mirrors": {
4516
  "hf_artifacts": {
4517
  "path": "hf_artifacts:scripts/omni/score_existing_model_output_task_probes.py",
4518
  "exists": true,
4519
- "bytes": 57470,
4520
- "sha256": "9a0708885c1a22addc0bec199488021e277c7a7b7e23d6a37344fbbb3e5f1b96"
4521
  },
4522
  "hf_model": {
4523
  "path": "hf_model:scripts/omni/score_existing_model_output_task_probes.py",
4524
  "exists": true,
4525
- "bytes": 57470,
4526
- "sha256": "9a0708885c1a22addc0bec199488021e277c7a7b7e23d6a37344fbbb3e5f1b96"
4527
  }
4528
  },
4529
  "failures": []
@@ -5034,21 +5034,21 @@
5034
  "local": {
5035
  "path": "repo:scripts/build_unified_task_model_radar.py",
5036
  "exists": true,
5037
- "bytes": 56295,
5038
- "sha256": "237ef6a08dd81b9fcb0256f6f6b54394f74c14daea0cbba8f1726fdbbb7feff0"
5039
  },
5040
  "mirrors": {
5041
  "hf_artifacts": {
5042
  "path": "hf_artifacts:scripts/build_unified_task_model_radar.py",
5043
  "exists": true,
5044
- "bytes": 56295,
5045
- "sha256": "237ef6a08dd81b9fcb0256f6f6b54394f74c14daea0cbba8f1726fdbbb7feff0"
5046
  },
5047
  "hf_model": {
5048
  "path": "hf_model:scripts/build_unified_task_model_radar.py",
5049
  "exists": true,
5050
- "bytes": 56295,
5051
- "sha256": "237ef6a08dd81b9fcb0256f6f6b54394f74c14daea0cbba8f1726fdbbb7feff0"
5052
  }
5053
  },
5054
  "failures": []
@@ -5464,38 +5464,38 @@
5464
  "path": "repo:docs/index.html",
5465
  "exists": true,
5466
  "bytes": 254770,
5467
- "sha256": "9273d6b20b166a8d18bb30f13c9f15389a3808e8c71265d68dd9481911fc5d66"
5468
  },
5469
  "mirrors": {
5470
  "hf_space": {
5471
  "path": "hf_space:index.html",
5472
  "exists": true,
5473
  "bytes": 254770,
5474
- "sha256": "9273d6b20b166a8d18bb30f13c9f15389a3808e8c71265d68dd9481911fc5d66"
5475
  },
5476
  "hf_artifacts_root": {
5477
  "path": "hf_artifacts:index.html",
5478
  "exists": true,
5479
  "bytes": 254770,
5480
- "sha256": "9273d6b20b166a8d18bb30f13c9f15389a3808e8c71265d68dd9481911fc5d66"
5481
  },
5482
  "hf_artifacts_docs": {
5483
  "path": "hf_artifacts:docs/index.html",
5484
  "exists": true,
5485
  "bytes": 254770,
5486
- "sha256": "9273d6b20b166a8d18bb30f13c9f15389a3808e8c71265d68dd9481911fc5d66"
5487
  },
5488
  "hf_model": {
5489
  "path": "hf_model:index.html",
5490
  "exists": true,
5491
  "bytes": 254770,
5492
- "sha256": "9273d6b20b166a8d18bb30f13c9f15389a3808e8c71265d68dd9481911fc5d66"
5493
  },
5494
  "hf_model_docs": {
5495
  "path": "hf_model:docs/index.html",
5496
  "exists": true,
5497
  "bytes": 254770,
5498
- "sha256": "9273d6b20b166a8d18bb30f13c9f15389a3808e8c71265d68dd9481911fc5d66"
5499
  }
5500
  },
5501
  "failures": []
@@ -12510,21 +12510,21 @@
12510
  "local": {
12511
  "path": "repo:results/omni_finetune/model_output_probe_readiness/RUN_REPORT.md",
12512
  "exists": true,
12513
- "bytes": 1047,
12514
- "sha256": "823b4dcc50bbaf8e5124abf3b9ec3c88dbfe7f5be1995769f7a537f31adfa31d"
12515
  },
12516
  "mirrors": {
12517
  "hf_artifacts": {
12518
  "path": "hf_artifacts:results/omni_finetune/model_output_probe_readiness/RUN_REPORT.md",
12519
  "exists": true,
12520
- "bytes": 1047,
12521
- "sha256": "823b4dcc50bbaf8e5124abf3b9ec3c88dbfe7f5be1995769f7a537f31adfa31d"
12522
  },
12523
  "hf_model": {
12524
  "path": "hf_model:results/omni_finetune/model_output_probe_readiness/RUN_REPORT.md",
12525
  "exists": true,
12526
- "bytes": 1047,
12527
- "sha256": "823b4dcc50bbaf8e5124abf3b9ec3c88dbfe7f5be1995769f7a537f31adfa31d"
12528
  }
12529
  },
12530
  "failures": []
@@ -12535,21 +12535,21 @@
12535
  "local": {
12536
  "path": "repo:results/omni_finetune/model_output_probe_readiness/model_output_probe_readiness.json",
12537
  "exists": true,
12538
- "bytes": 5144,
12539
- "sha256": "86835a291c659d335ab5b51d09ea3f36710c14d23466a72d9c2a23137dc9ae8a"
12540
  },
12541
  "mirrors": {
12542
  "hf_artifacts": {
12543
  "path": "hf_artifacts:results/omni_finetune/model_output_probe_readiness/model_output_probe_readiness.json",
12544
  "exists": true,
12545
- "bytes": 5144,
12546
- "sha256": "86835a291c659d335ab5b51d09ea3f36710c14d23466a72d9c2a23137dc9ae8a"
12547
  },
12548
  "hf_model": {
12549
  "path": "hf_model:results/omni_finetune/model_output_probe_readiness/model_output_probe_readiness.json",
12550
  "exists": true,
12551
- "bytes": 5144,
12552
- "sha256": "86835a291c659d335ab5b51d09ea3f36710c14d23466a72d9c2a23137dc9ae8a"
12553
  }
12554
  },
12555
  "failures": []
@@ -12560,21 +12560,96 @@
12560
  "local": {
12561
  "path": "repo:results/omni_finetune/model_output_task_probes_20260616/RUN_REPORT.md",
12562
  "exists": true,
12563
- "bytes": 1421,
12564
- "sha256": "7f2156454573d3174ed5ddb029864fdf65214d9f8c09a151d0a3bd9a0ef86452"
12565
  },
12566
  "mirrors": {
12567
  "hf_artifacts": {
12568
  "path": "hf_artifacts:results/omni_finetune/model_output_task_probes_20260616/RUN_REPORT.md",
12569
  "exists": true,
12570
- "bytes": 1421,
12571
- "sha256": "7f2156454573d3174ed5ddb029864fdf65214d9f8c09a151d0a3bd9a0ef86452"
12572
  },
12573
  "hf_model": {
12574
  "path": "hf_model:results/omni_finetune/model_output_task_probes_20260616/RUN_REPORT.md",
12575
  "exists": true,
12576
- "bytes": 1421,
12577
- "sha256": "7f2156454573d3174ed5ddb029864fdf65214d9f8c09a151d0a3bd9a0ef86452"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
12578
  }
12579
  },
12580
  "failures": []
@@ -12586,20 +12661,20 @@
12586
  "path": "repo:results/omni_finetune/model_output_task_probes_20260616/action_object_relation/cosmos3_super_reasoner/metrics.json",
12587
  "exists": true,
12588
  "bytes": 21876,
12589
- "sha256": "a1d506a2c132d1d0e8bf31a9ba8618fec88bac75b056f99c50219514fdf3e22e"
12590
  },
12591
  "mirrors": {
12592
  "hf_artifacts": {
12593
  "path": "hf_artifacts:results/omni_finetune/model_output_task_probes_20260616/action_object_relation/cosmos3_super_reasoner/metrics.json",
12594
  "exists": true,
12595
  "bytes": 21876,
12596
- "sha256": "a1d506a2c132d1d0e8bf31a9ba8618fec88bac75b056f99c50219514fdf3e22e"
12597
  },
12598
  "hf_model": {
12599
  "path": "hf_model:results/omni_finetune/model_output_task_probes_20260616/action_object_relation/cosmos3_super_reasoner/metrics.json",
12600
  "exists": true,
12601
  "bytes": 21876,
12602
- "sha256": "a1d506a2c132d1d0e8bf31a9ba8618fec88bac75b056f99c50219514fdf3e22e"
12603
  }
12604
  },
12605
  "failures": []
@@ -12661,20 +12736,20 @@
12661
  "path": "repo:results/omni_finetune/model_output_task_probes_20260616/action_object_relation/qwen3_omni_v6_lora/metrics.json",
12662
  "exists": true,
12663
  "bytes": 169938,
12664
- "sha256": "e5754d22070d2b25b60e03e1c9acde49daacce48b871c7f4520d130355c07eb1"
12665
  },
12666
  "mirrors": {
12667
  "hf_artifacts": {
12668
  "path": "hf_artifacts:results/omni_finetune/model_output_task_probes_20260616/action_object_relation/qwen3_omni_v6_lora/metrics.json",
12669
  "exists": true,
12670
  "bytes": 169938,
12671
- "sha256": "e5754d22070d2b25b60e03e1c9acde49daacce48b871c7f4520d130355c07eb1"
12672
  },
12673
  "hf_model": {
12674
  "path": "hf_model:results/omni_finetune/model_output_task_probes_20260616/action_object_relation/qwen3_omni_v6_lora/metrics.json",
12675
  "exists": true,
12676
  "bytes": 169938,
12677
- "sha256": "e5754d22070d2b25b60e03e1c9acde49daacce48b871c7f4520d130355c07eb1"
12678
  }
12679
  },
12680
  "failures": []
@@ -12729,6 +12804,56 @@
12729
  },
12730
  "failures": []
12731
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
12732
  {
12733
  "name": "results/omni_finetune/model_output_task_probes_20260616/cosmos3_nano_future_window_source_window_map.jsonl",
12734
  "status": "pass",
@@ -12786,20 +12911,20 @@
12786
  "path": "repo:results/omni_finetune/model_output_task_probes_20260616/long_horizon_next_action/cosmos3_nano_future_window/metrics.json",
12787
  "exists": true,
12788
  "bytes": 7404,
12789
- "sha256": "fe39f6894d2b71411b4272e555d1801e55f3b4ed419e0d4cd19e0e4ed53f60f1"
12790
  },
12791
  "mirrors": {
12792
  "hf_artifacts": {
12793
  "path": "hf_artifacts:results/omni_finetune/model_output_task_probes_20260616/long_horizon_next_action/cosmos3_nano_future_window/metrics.json",
12794
  "exists": true,
12795
  "bytes": 7404,
12796
- "sha256": "fe39f6894d2b71411b4272e555d1801e55f3b4ed419e0d4cd19e0e4ed53f60f1"
12797
  },
12798
  "hf_model": {
12799
  "path": "hf_model:results/omni_finetune/model_output_task_probes_20260616/long_horizon_next_action/cosmos3_nano_future_window/metrics.json",
12800
  "exists": true,
12801
  "bytes": 7404,
12802
- "sha256": "fe39f6894d2b71411b4272e555d1801e55f3b4ed419e0d4cd19e0e4ed53f60f1"
12803
  }
12804
  },
12805
  "failures": []
@@ -12861,20 +12986,20 @@
12861
  "path": "repo:results/omni_finetune/model_output_task_probes_20260616/long_horizon_next_action/cosmos3_super_reasoner/metrics.json",
12862
  "exists": true,
12863
  "bytes": 10051,
12864
- "sha256": "b7773f4af1284dfb498c69ba174049056e038ce10465281b657223629d1dab5f"
12865
  },
12866
  "mirrors": {
12867
  "hf_artifacts": {
12868
  "path": "hf_artifacts:results/omni_finetune/model_output_task_probes_20260616/long_horizon_next_action/cosmos3_super_reasoner/metrics.json",
12869
  "exists": true,
12870
  "bytes": 10051,
12871
- "sha256": "b7773f4af1284dfb498c69ba174049056e038ce10465281b657223629d1dab5f"
12872
  },
12873
  "hf_model": {
12874
  "path": "hf_model:results/omni_finetune/model_output_task_probes_20260616/long_horizon_next_action/cosmos3_super_reasoner/metrics.json",
12875
  "exists": true,
12876
  "bytes": 10051,
12877
- "sha256": "b7773f4af1284dfb498c69ba174049056e038ce10465281b657223629d1dab5f"
12878
  }
12879
  },
12880
  "failures": []
@@ -12936,20 +13061,20 @@
12936
  "path": "repo:results/omni_finetune/model_output_task_probes_20260616/modality_reconstruction/cosmos3_nano_future_window/metrics.json",
12937
  "exists": true,
12938
  "bytes": 1825,
12939
- "sha256": "4d04bb2e461a76d0a8f9ec37f6b73915c87544472406b3ca576cb791f100db92"
12940
  },
12941
  "mirrors": {
12942
  "hf_artifacts": {
12943
  "path": "hf_artifacts:results/omni_finetune/model_output_task_probes_20260616/modality_reconstruction/cosmos3_nano_future_window/metrics.json",
12944
  "exists": true,
12945
  "bytes": 1825,
12946
- "sha256": "4d04bb2e461a76d0a8f9ec37f6b73915c87544472406b3ca576cb791f100db92"
12947
  },
12948
  "hf_model": {
12949
  "path": "hf_model:results/omni_finetune/model_output_task_probes_20260616/modality_reconstruction/cosmos3_nano_future_window/metrics.json",
12950
  "exists": true,
12951
  "bytes": 1825,
12952
- "sha256": "4d04bb2e461a76d0a8f9ec37f6b73915c87544472406b3ca576cb791f100db92"
12953
  }
12954
  },
12955
  "failures": []
@@ -12961,20 +13086,20 @@
12961
  "path": "repo:results/omni_finetune/model_output_task_probes_20260616/next_subtask_forecast/cosmos3_nano_future_window/metrics.json",
12962
  "exists": true,
12963
  "bytes": 5594,
12964
- "sha256": "0f2b7b041ae7cd46b128427634d0328178303c1ede02643fb86a68933c149099"
12965
  },
12966
  "mirrors": {
12967
  "hf_artifacts": {
12968
  "path": "hf_artifacts:results/omni_finetune/model_output_task_probes_20260616/next_subtask_forecast/cosmos3_nano_future_window/metrics.json",
12969
  "exists": true,
12970
  "bytes": 5594,
12971
- "sha256": "0f2b7b041ae7cd46b128427634d0328178303c1ede02643fb86a68933c149099"
12972
  },
12973
  "hf_model": {
12974
  "path": "hf_model:results/omni_finetune/model_output_task_probes_20260616/next_subtask_forecast/cosmos3_nano_future_window/metrics.json",
12975
  "exists": true,
12976
  "bytes": 5594,
12977
- "sha256": "0f2b7b041ae7cd46b128427634d0328178303c1ede02643fb86a68933c149099"
12978
  }
12979
  },
12980
  "failures": []
@@ -13036,20 +13161,20 @@
13036
  "path": "repo:results/omni_finetune/model_output_task_probes_20260616/object_set_forecast/cosmos3_nano_future_window/metrics.json",
13037
  "exists": true,
13038
  "bytes": 2225,
13039
- "sha256": "f080f27c4457005ae1383d31cde22fc3c51b0c065eda3e0b5842135048254877"
13040
  },
13041
  "mirrors": {
13042
  "hf_artifacts": {
13043
  "path": "hf_artifacts:results/omni_finetune/model_output_task_probes_20260616/object_set_forecast/cosmos3_nano_future_window/metrics.json",
13044
  "exists": true,
13045
  "bytes": 2225,
13046
- "sha256": "f080f27c4457005ae1383d31cde22fc3c51b0c065eda3e0b5842135048254877"
13047
  },
13048
  "hf_model": {
13049
  "path": "hf_model:results/omni_finetune/model_output_task_probes_20260616/object_set_forecast/cosmos3_nano_future_window/metrics.json",
13050
  "exists": true,
13051
  "bytes": 2225,
13052
- "sha256": "f080f27c4457005ae1383d31cde22fc3c51b0c065eda3e0b5842135048254877"
13053
  }
13054
  },
13055
  "failures": []
@@ -13085,21 +13210,21 @@
13085
  "local": {
13086
  "path": "repo:results/omni_finetune/model_output_task_probes_20260616/summary.json",
13087
  "exists": true,
13088
- "bytes": 5278,
13089
- "sha256": "4a27f39807e8ac13771e2109584a8b0265961bcea88445058cbfe87265457d7f"
13090
  },
13091
  "mirrors": {
13092
  "hf_artifacts": {
13093
  "path": "hf_artifacts:results/omni_finetune/model_output_task_probes_20260616/summary.json",
13094
  "exists": true,
13095
- "bytes": 5278,
13096
- "sha256": "4a27f39807e8ac13771e2109584a8b0265961bcea88445058cbfe87265457d7f"
13097
  },
13098
  "hf_model": {
13099
  "path": "hf_model:results/omni_finetune/model_output_task_probes_20260616/summary.json",
13100
  "exists": true,
13101
- "bytes": 5278,
13102
- "sha256": "4a27f39807e8ac13771e2109584a8b0265961bcea88445058cbfe87265457d7f"
13103
  }
13104
  },
13105
  "failures": []
@@ -13111,20 +13236,20 @@
13111
  "path": "repo:results/omni_finetune/model_output_task_probes_20260616/time_to_transition/cosmos3_nano_future_window/metrics.json",
13112
  "exists": true,
13113
  "bytes": 2398,
13114
- "sha256": "31b36b403d37ee21efed27e9c2c5c4b46806bb1caff9f9159c5914c6c104a61c"
13115
  },
13116
  "mirrors": {
13117
  "hf_artifacts": {
13118
  "path": "hf_artifacts:results/omni_finetune/model_output_task_probes_20260616/time_to_transition/cosmos3_nano_future_window/metrics.json",
13119
  "exists": true,
13120
  "bytes": 2398,
13121
- "sha256": "31b36b403d37ee21efed27e9c2c5c4b46806bb1caff9f9159c5914c6c104a61c"
13122
  },
13123
  "hf_model": {
13124
  "path": "hf_model:results/omni_finetune/model_output_task_probes_20260616/time_to_transition/cosmos3_nano_future_window/metrics.json",
13125
  "exists": true,
13126
  "bytes": 2398,
13127
- "sha256": "31b36b403d37ee21efed27e9c2c5c4b46806bb1caff9f9159c5914c6c104a61c"
13128
  }
13129
  },
13130
  "failures": []
@@ -13161,20 +13286,20 @@
13161
  "path": "repo:results/omni_finetune/model_output_task_probes_20260616/time_to_transition/cosmos3_super_reasoner/metrics.json",
13162
  "exists": true,
13163
  "bytes": 2049,
13164
- "sha256": "6eae6e5b12a4073e98531046451c8ef332f0ca469a741aab09e94c952dc754cb"
13165
  },
13166
  "mirrors": {
13167
  "hf_artifacts": {
13168
  "path": "hf_artifacts:results/omni_finetune/model_output_task_probes_20260616/time_to_transition/cosmos3_super_reasoner/metrics.json",
13169
  "exists": true,
13170
  "bytes": 2049,
13171
- "sha256": "6eae6e5b12a4073e98531046451c8ef332f0ca469a741aab09e94c952dc754cb"
13172
  },
13173
  "hf_model": {
13174
  "path": "hf_model:results/omni_finetune/model_output_task_probes_20260616/time_to_transition/cosmos3_super_reasoner/metrics.json",
13175
  "exists": true,
13176
  "bytes": 2049,
13177
- "sha256": "6eae6e5b12a4073e98531046451c8ef332f0ca469a741aab09e94c952dc754cb"
13178
  }
13179
  },
13180
  "failures": []
@@ -20667,15 +20792,72 @@
20667
  "local": {
20668
  "path": "repo:results/omni_finetune/model_output_task_probes_20260616/RUN_REPORT.md",
20669
  "exists": true,
20670
- "bytes": 1421,
20671
- "sha256": "7f2156454573d3174ed5ddb029864fdf65214d9f8c09a151d0a3bd9a0ef86452"
20672
  },
20673
  "mirrors": {
20674
  "hf_space": {
20675
  "path": "hf_space:results/omni_finetune/model_output_task_probes_20260616/RUN_REPORT.md",
20676
  "exists": true,
20677
- "bytes": 1421,
20678
- "sha256": "7f2156454573d3174ed5ddb029864fdf65214d9f8c09a151d0a3bd9a0ef86452"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
20679
  }
20680
  },
20681
  "failures": []
@@ -20687,14 +20869,14 @@
20687
  "path": "repo:results/omni_finetune/model_output_task_probes_20260616/action_object_relation/cosmos3_super_reasoner/metrics.json",
20688
  "exists": true,
20689
  "bytes": 21876,
20690
- "sha256": "a1d506a2c132d1d0e8bf31a9ba8618fec88bac75b056f99c50219514fdf3e22e"
20691
  },
20692
  "mirrors": {
20693
  "hf_space": {
20694
  "path": "hf_space:results/omni_finetune/model_output_task_probes_20260616/action_object_relation/cosmos3_super_reasoner/metrics.json",
20695
  "exists": true,
20696
  "bytes": 21876,
20697
- "sha256": "a1d506a2c132d1d0e8bf31a9ba8618fec88bac75b056f99c50219514fdf3e22e"
20698
  }
20699
  },
20700
  "failures": []
@@ -20744,14 +20926,14 @@
20744
  "path": "repo:results/omni_finetune/model_output_task_probes_20260616/action_object_relation/qwen3_omni_v6_lora/metrics.json",
20745
  "exists": true,
20746
  "bytes": 169938,
20747
- "sha256": "e5754d22070d2b25b60e03e1c9acde49daacce48b871c7f4520d130355c07eb1"
20748
  },
20749
  "mirrors": {
20750
  "hf_space": {
20751
  "path": "hf_space:results/omni_finetune/model_output_task_probes_20260616/action_object_relation/qwen3_omni_v6_lora/metrics.json",
20752
  "exists": true,
20753
  "bytes": 169938,
20754
- "sha256": "e5754d22070d2b25b60e03e1c9acde49daacce48b871c7f4520d130355c07eb1"
20755
  }
20756
  },
20757
  "failures": []
@@ -20794,6 +20976,44 @@
20794
  },
20795
  "failures": []
20796
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
20797
  {
20798
  "name": "space_results/omni_finetune/model_output_task_probes_20260616/cosmos3_nano_future_window_source_window_map.jsonl",
20799
  "status": "pass",
@@ -20839,14 +21059,14 @@
20839
  "path": "repo:results/omni_finetune/model_output_task_probes_20260616/long_horizon_next_action/cosmos3_nano_future_window/metrics.json",
20840
  "exists": true,
20841
  "bytes": 7404,
20842
- "sha256": "fe39f6894d2b71411b4272e555d1801e55f3b4ed419e0d4cd19e0e4ed53f60f1"
20843
  },
20844
  "mirrors": {
20845
  "hf_space": {
20846
  "path": "hf_space:results/omni_finetune/model_output_task_probes_20260616/long_horizon_next_action/cosmos3_nano_future_window/metrics.json",
20847
  "exists": true,
20848
  "bytes": 7404,
20849
- "sha256": "fe39f6894d2b71411b4272e555d1801e55f3b4ed419e0d4cd19e0e4ed53f60f1"
20850
  }
20851
  },
20852
  "failures": []
@@ -20896,14 +21116,14 @@
20896
  "path": "repo:results/omni_finetune/model_output_task_probes_20260616/long_horizon_next_action/cosmos3_super_reasoner/metrics.json",
20897
  "exists": true,
20898
  "bytes": 10051,
20899
- "sha256": "b7773f4af1284dfb498c69ba174049056e038ce10465281b657223629d1dab5f"
20900
  },
20901
  "mirrors": {
20902
  "hf_space": {
20903
  "path": "hf_space:results/omni_finetune/model_output_task_probes_20260616/long_horizon_next_action/cosmos3_super_reasoner/metrics.json",
20904
  "exists": true,
20905
  "bytes": 10051,
20906
- "sha256": "b7773f4af1284dfb498c69ba174049056e038ce10465281b657223629d1dab5f"
20907
  }
20908
  },
20909
  "failures": []
@@ -20953,14 +21173,14 @@
20953
  "path": "repo:results/omni_finetune/model_output_task_probes_20260616/modality_reconstruction/cosmos3_nano_future_window/metrics.json",
20954
  "exists": true,
20955
  "bytes": 1825,
20956
- "sha256": "4d04bb2e461a76d0a8f9ec37f6b73915c87544472406b3ca576cb791f100db92"
20957
  },
20958
  "mirrors": {
20959
  "hf_space": {
20960
  "path": "hf_space:results/omni_finetune/model_output_task_probes_20260616/modality_reconstruction/cosmos3_nano_future_window/metrics.json",
20961
  "exists": true,
20962
  "bytes": 1825,
20963
- "sha256": "4d04bb2e461a76d0a8f9ec37f6b73915c87544472406b3ca576cb791f100db92"
20964
  }
20965
  },
20966
  "failures": []
@@ -20972,14 +21192,14 @@
20972
  "path": "repo:results/omni_finetune/model_output_task_probes_20260616/next_subtask_forecast/cosmos3_nano_future_window/metrics.json",
20973
  "exists": true,
20974
  "bytes": 5594,
20975
- "sha256": "0f2b7b041ae7cd46b128427634d0328178303c1ede02643fb86a68933c149099"
20976
  },
20977
  "mirrors": {
20978
  "hf_space": {
20979
  "path": "hf_space:results/omni_finetune/model_output_task_probes_20260616/next_subtask_forecast/cosmos3_nano_future_window/metrics.json",
20980
  "exists": true,
20981
  "bytes": 5594,
20982
- "sha256": "0f2b7b041ae7cd46b128427634d0328178303c1ede02643fb86a68933c149099"
20983
  }
20984
  },
20985
  "failures": []
@@ -21029,14 +21249,14 @@
21029
  "path": "repo:results/omni_finetune/model_output_task_probes_20260616/object_set_forecast/cosmos3_nano_future_window/metrics.json",
21030
  "exists": true,
21031
  "bytes": 2225,
21032
- "sha256": "f080f27c4457005ae1383d31cde22fc3c51b0c065eda3e0b5842135048254877"
21033
  },
21034
  "mirrors": {
21035
  "hf_space": {
21036
  "path": "hf_space:results/omni_finetune/model_output_task_probes_20260616/object_set_forecast/cosmos3_nano_future_window/metrics.json",
21037
  "exists": true,
21038
  "bytes": 2225,
21039
- "sha256": "f080f27c4457005ae1383d31cde22fc3c51b0c065eda3e0b5842135048254877"
21040
  }
21041
  },
21042
  "failures": []
@@ -21066,15 +21286,15 @@
21066
  "local": {
21067
  "path": "repo:results/omni_finetune/model_output_task_probes_20260616/summary.json",
21068
  "exists": true,
21069
- "bytes": 5278,
21070
- "sha256": "4a27f39807e8ac13771e2109584a8b0265961bcea88445058cbfe87265457d7f"
21071
  },
21072
  "mirrors": {
21073
  "hf_space": {
21074
  "path": "hf_space:results/omni_finetune/model_output_task_probes_20260616/summary.json",
21075
  "exists": true,
21076
- "bytes": 5278,
21077
- "sha256": "4a27f39807e8ac13771e2109584a8b0265961bcea88445058cbfe87265457d7f"
21078
  }
21079
  },
21080
  "failures": []
@@ -21086,14 +21306,14 @@
21086
  "path": "repo:results/omni_finetune/model_output_task_probes_20260616/time_to_transition/cosmos3_nano_future_window/metrics.json",
21087
  "exists": true,
21088
  "bytes": 2398,
21089
- "sha256": "31b36b403d37ee21efed27e9c2c5c4b46806bb1caff9f9159c5914c6c104a61c"
21090
  },
21091
  "mirrors": {
21092
  "hf_space": {
21093
  "path": "hf_space:results/omni_finetune/model_output_task_probes_20260616/time_to_transition/cosmos3_nano_future_window/metrics.json",
21094
  "exists": true,
21095
  "bytes": 2398,
21096
- "sha256": "31b36b403d37ee21efed27e9c2c5c4b46806bb1caff9f9159c5914c6c104a61c"
21097
  }
21098
  },
21099
  "failures": []
@@ -21124,14 +21344,14 @@
21124
  "path": "repo:results/omni_finetune/model_output_task_probes_20260616/time_to_transition/cosmos3_super_reasoner/metrics.json",
21125
  "exists": true,
21126
  "bytes": 2049,
21127
- "sha256": "6eae6e5b12a4073e98531046451c8ef332f0ca469a741aab09e94c952dc754cb"
21128
  },
21129
  "mirrors": {
21130
  "hf_space": {
21131
  "path": "hf_space:results/omni_finetune/model_output_task_probes_20260616/time_to_transition/cosmos3_super_reasoner/metrics.json",
21132
  "exists": true,
21133
  "bytes": 2049,
21134
- "sha256": "6eae6e5b12a4073e98531046451c8ef332f0ca469a741aab09e94c952dc754cb"
21135
  }
21136
  },
21137
  "failures": []
@@ -22710,27 +22930,27 @@
22710
  "local": {
22711
  "path": "repo:TASK_METHOD_20_GAP_AUDIT.md",
22712
  "exists": true,
22713
- "bytes": 8787,
22714
- "sha256": "8fd8555f75cd96c31346618ab622e24655027cea5c52e8a09a7a53793ef7b72b"
22715
  },
22716
  "mirrors": {
22717
  "hf_space": {
22718
  "path": "hf_space:TASK_METHOD_20_GAP_AUDIT.md",
22719
  "exists": true,
22720
- "bytes": 8787,
22721
- "sha256": "8fd8555f75cd96c31346618ab622e24655027cea5c52e8a09a7a53793ef7b72b"
22722
  },
22723
  "hf_artifacts": {
22724
  "path": "hf_artifacts:TASK_METHOD_20_GAP_AUDIT.md",
22725
  "exists": true,
22726
- "bytes": 8787,
22727
- "sha256": "8fd8555f75cd96c31346618ab622e24655027cea5c52e8a09a7a53793ef7b72b"
22728
  },
22729
  "hf_model": {
22730
  "path": "hf_model:TASK_METHOD_20_GAP_AUDIT.md",
22731
  "exists": true,
22732
- "bytes": 8787,
22733
- "sha256": "8fd8555f75cd96c31346618ab622e24655027cea5c52e8a09a7a53793ef7b72b"
22734
  }
22735
  },
22736
  "failures": []
@@ -22741,27 +22961,27 @@
22741
  "local": {
22742
  "path": "repo:TASK_METHOD_20_RESULT_MATRIX.md",
22743
  "exists": true,
22744
- "bytes": 3892,
22745
- "sha256": "590d9362624d64b81b1b19638c46faa7969730d40415e4825abd2ff09d76340a"
22746
  },
22747
  "mirrors": {
22748
  "hf_space": {
22749
  "path": "hf_space:TASK_METHOD_20_RESULT_MATRIX.md",
22750
  "exists": true,
22751
- "bytes": 3892,
22752
- "sha256": "590d9362624d64b81b1b19638c46faa7969730d40415e4825abd2ff09d76340a"
22753
  },
22754
  "hf_artifacts": {
22755
  "path": "hf_artifacts:TASK_METHOD_20_RESULT_MATRIX.md",
22756
  "exists": true,
22757
- "bytes": 3892,
22758
- "sha256": "590d9362624d64b81b1b19638c46faa7969730d40415e4825abd2ff09d76340a"
22759
  },
22760
  "hf_model": {
22761
  "path": "hf_model:TASK_METHOD_20_RESULT_MATRIX.md",
22762
  "exists": true,
22763
- "bytes": 3892,
22764
- "sha256": "590d9362624d64b81b1b19638c46faa7969730d40415e4825abd2ff09d76340a"
22765
  }
22766
  },
22767
  "failures": []
 
1
  {
2
  "status": "pass",
3
+ "generated_at_utc": "2026-06-18T22:59:08+00:00",
4
  "hf_root": "hf_publish",
5
  "summary": {
6
+ "group_count": 865,
7
  "failure_count": 0,
8
  "failures_by_surface": {}
9
  },
 
138
  "local": {
139
  "path": "repo:docs/data/artifact_index.json",
140
  "exists": true,
141
+ "bytes": 116644,
142
+ "sha256": "af87562c9963c897035e5d2a2f562423989a750c24809438f41b982986b7c658"
143
  },
144
  "mirrors": {
145
  "hf_space": {
146
  "path": "hf_space:data/artifact_index.json",
147
  "exists": true,
148
+ "bytes": 116644,
149
+ "sha256": "af87562c9963c897035e5d2a2f562423989a750c24809438f41b982986b7c658"
150
  },
151
  "hf_artifacts_data": {
152
  "path": "hf_artifacts:data/artifact_index.json",
153
  "exists": true,
154
+ "bytes": 116644,
155
+ "sha256": "af87562c9963c897035e5d2a2f562423989a750c24809438f41b982986b7c658"
156
  },
157
  "hf_artifacts": {
158
  "path": "hf_artifacts:docs/data/artifact_index.json",
159
  "exists": true,
160
+ "bytes": 116644,
161
+ "sha256": "af87562c9963c897035e5d2a2f562423989a750c24809438f41b982986b7c658"
162
  },
163
  "hf_model_data": {
164
  "path": "hf_model:data/artifact_index.json",
165
  "exists": true,
166
+ "bytes": 116644,
167
+ "sha256": "af87562c9963c897035e5d2a2f562423989a750c24809438f41b982986b7c658"
168
  },
169
  "hf_model_docs_data": {
170
  "path": "hf_model:docs/data/artifact_index.json",
171
  "exists": true,
172
+ "bytes": 116644,
173
+ "sha256": "af87562c9963c897035e5d2a2f562423989a750c24809438f41b982986b7c658"
174
  },
175
  "hf_model": {
176
  "path": "hf_model:metrics/artifact_index.json",
177
  "exists": true,
178
+ "bytes": 116644,
179
+ "sha256": "af87562c9963c897035e5d2a2f562423989a750c24809438f41b982986b7c658"
180
  }
181
  },
182
  "failures": []
 
922
  "local": {
923
  "path": "repo:docs/data/publication_audit.json",
924
  "exists": true,
925
+ "bytes": 9713,
926
+ "sha256": "33c3601546d5ff2e7c093071d8db2331d73097ac5360b60bbebb8902c2a6dda5"
927
  },
928
  "mirrors": {
929
  "hf_space": {
930
  "path": "hf_space:data/publication_audit.json",
931
  "exists": true,
932
+ "bytes": 9713,
933
+ "sha256": "33c3601546d5ff2e7c093071d8db2331d73097ac5360b60bbebb8902c2a6dda5"
934
  },
935
  "hf_artifacts_data": {
936
  "path": "hf_artifacts:data/publication_audit.json",
937
  "exists": true,
938
+ "bytes": 9713,
939
+ "sha256": "33c3601546d5ff2e7c093071d8db2331d73097ac5360b60bbebb8902c2a6dda5"
940
  },
941
  "hf_artifacts": {
942
  "path": "hf_artifacts:docs/data/publication_audit.json",
943
  "exists": true,
944
+ "bytes": 9713,
945
+ "sha256": "33c3601546d5ff2e7c093071d8db2331d73097ac5360b60bbebb8902c2a6dda5"
946
  },
947
  "hf_model_data": {
948
  "path": "hf_model:data/publication_audit.json",
949
  "exists": true,
950
+ "bytes": 9713,
951
+ "sha256": "33c3601546d5ff2e7c093071d8db2331d73097ac5360b60bbebb8902c2a6dda5"
952
  },
953
  "hf_model_docs_data": {
954
  "path": "hf_model:docs/data/publication_audit.json",
955
  "exists": true,
956
+ "bytes": 9713,
957
+ "sha256": "33c3601546d5ff2e7c093071d8db2331d73097ac5360b60bbebb8902c2a6dda5"
958
  },
959
  "hf_model": {
960
  "path": "hf_model:metrics/publication_audit.json",
961
  "exists": true,
962
+ "bytes": 9713,
963
+ "sha256": "33c3601546d5ff2e7c093071d8db2331d73097ac5360b60bbebb8902c2a6dda5"
964
  }
965
  },
966
  "failures": []
 
972
  "path": "repo:docs/data/public_surface_qa.json",
973
  "exists": true,
974
  "bytes": 7126,
975
+ "sha256": "0fd0ee7e07b83212d50cf95fa1e97c78baa0020ad26148122f28649b6829f082"
976
  },
977
  "mirrors": {
978
  "hf_space": {
979
  "path": "hf_space:data/public_surface_qa.json",
980
  "exists": true,
981
  "bytes": 7126,
982
+ "sha256": "0fd0ee7e07b83212d50cf95fa1e97c78baa0020ad26148122f28649b6829f082"
983
  },
984
  "hf_artifacts_data": {
985
  "path": "hf_artifacts:data/public_surface_qa.json",
986
  "exists": true,
987
  "bytes": 7126,
988
+ "sha256": "0fd0ee7e07b83212d50cf95fa1e97c78baa0020ad26148122f28649b6829f082"
989
  },
990
  "hf_artifacts": {
991
  "path": "hf_artifacts:docs/data/public_surface_qa.json",
992
  "exists": true,
993
  "bytes": 7126,
994
+ "sha256": "0fd0ee7e07b83212d50cf95fa1e97c78baa0020ad26148122f28649b6829f082"
995
  },
996
  "hf_model_data": {
997
  "path": "hf_model:data/public_surface_qa.json",
998
  "exists": true,
999
  "bytes": 7126,
1000
+ "sha256": "0fd0ee7e07b83212d50cf95fa1e97c78baa0020ad26148122f28649b6829f082"
1001
  },
1002
  "hf_model_docs_data": {
1003
  "path": "hf_model:docs/data/public_surface_qa.json",
1004
  "exists": true,
1005
  "bytes": 7126,
1006
+ "sha256": "0fd0ee7e07b83212d50cf95fa1e97c78baa0020ad26148122f28649b6829f082"
1007
  },
1008
  "hf_model": {
1009
  "path": "hf_model:metrics/public_surface_qa.json",
1010
  "exists": true,
1011
  "bytes": 7126,
1012
+ "sha256": "0fd0ee7e07b83212d50cf95fa1e97c78baa0020ad26148122f28649b6829f082"
1013
  }
1014
  },
1015
  "failures": []
 
1119
  "path": "repo:docs/data/quality_gates.json",
1120
  "exists": true,
1121
  "bytes": 8100,
1122
+ "sha256": "b88b46bd9b16d4afaf4836d0acff208b46559a493cfcffa881f1528fa282292c"
1123
  },
1124
  "mirrors": {
1125
  "hf_space": {
1126
  "path": "hf_space:data/quality_gates.json",
1127
  "exists": true,
1128
  "bytes": 8100,
1129
+ "sha256": "b88b46bd9b16d4afaf4836d0acff208b46559a493cfcffa881f1528fa282292c"
1130
  },
1131
  "hf_artifacts_data": {
1132
  "path": "hf_artifacts:data/quality_gates.json",
1133
  "exists": true,
1134
  "bytes": 8100,
1135
+ "sha256": "b88b46bd9b16d4afaf4836d0acff208b46559a493cfcffa881f1528fa282292c"
1136
  },
1137
  "hf_artifacts": {
1138
  "path": "hf_artifacts:docs/data/quality_gates.json",
1139
  "exists": true,
1140
  "bytes": 8100,
1141
+ "sha256": "b88b46bd9b16d4afaf4836d0acff208b46559a493cfcffa881f1528fa282292c"
1142
  },
1143
  "hf_model_data": {
1144
  "path": "hf_model:data/quality_gates.json",
1145
  "exists": true,
1146
  "bytes": 8100,
1147
+ "sha256": "b88b46bd9b16d4afaf4836d0acff208b46559a493cfcffa881f1528fa282292c"
1148
  },
1149
  "hf_model_docs_data": {
1150
  "path": "hf_model:docs/data/quality_gates.json",
1151
  "exists": true,
1152
  "bytes": 8100,
1153
+ "sha256": "b88b46bd9b16d4afaf4836d0acff208b46559a493cfcffa881f1528fa282292c"
1154
  },
1155
  "hf_model": {
1156
  "path": "hf_model:metrics/quality_gates.json",
1157
  "exists": true,
1158
  "bytes": 8100,
1159
+ "sha256": "b88b46bd9b16d4afaf4836d0acff208b46559a493cfcffa881f1528fa282292c"
1160
  }
1161
  },
1162
  "failures": []
 
1560
  "path": "repo:docs/data/scope_claims_audit.json",
1561
  "exists": true,
1562
  "bytes": 21630,
1563
+ "sha256": "a4d8a83955779c23e3cf985a2cbbc49fd544c85bf8495c1ff7d37d9630fcc479"
1564
  },
1565
  "mirrors": {
1566
  "hf_space": {
1567
  "path": "hf_space:data/scope_claims_audit.json",
1568
  "exists": true,
1569
  "bytes": 21630,
1570
+ "sha256": "a4d8a83955779c23e3cf985a2cbbc49fd544c85bf8495c1ff7d37d9630fcc479"
1571
  },
1572
  "hf_artifacts_data": {
1573
  "path": "hf_artifacts:data/scope_claims_audit.json",
1574
  "exists": true,
1575
  "bytes": 21630,
1576
+ "sha256": "a4d8a83955779c23e3cf985a2cbbc49fd544c85bf8495c1ff7d37d9630fcc479"
1577
  },
1578
  "hf_artifacts": {
1579
  "path": "hf_artifacts:docs/data/scope_claims_audit.json",
1580
  "exists": true,
1581
  "bytes": 21630,
1582
+ "sha256": "a4d8a83955779c23e3cf985a2cbbc49fd544c85bf8495c1ff7d37d9630fcc479"
1583
  },
1584
  "hf_model_data": {
1585
  "path": "hf_model:data/scope_claims_audit.json",
1586
  "exists": true,
1587
  "bytes": 21630,
1588
+ "sha256": "a4d8a83955779c23e3cf985a2cbbc49fd544c85bf8495c1ff7d37d9630fcc479"
1589
  },
1590
  "hf_model_docs_data": {
1591
  "path": "hf_model:docs/data/scope_claims_audit.json",
1592
  "exists": true,
1593
  "bytes": 21630,
1594
+ "sha256": "a4d8a83955779c23e3cf985a2cbbc49fd544c85bf8495c1ff7d37d9630fcc479"
1595
  },
1596
  "hf_model": {
1597
  "path": "hf_model:metrics/scope_claims_audit.json",
1598
  "exists": true,
1599
  "bytes": 21630,
1600
+ "sha256": "a4d8a83955779c23e3cf985a2cbbc49fd544c85bf8495c1ff7d37d9630fcc479"
1601
  }
1602
  },
1603
  "failures": []
 
1658
  "path": "repo:docs/data/source_alignment_audit.json",
1659
  "exists": true,
1660
  "bytes": 4432,
1661
+ "sha256": "d51f321ea35f0e57aeaaa41dad9af0cccdc1fde2c61e9559cc374a1e5fd85f4a"
1662
  },
1663
  "mirrors": {
1664
  "hf_space": {
1665
  "path": "hf_space:data/source_alignment_audit.json",
1666
  "exists": true,
1667
  "bytes": 4432,
1668
+ "sha256": "d51f321ea35f0e57aeaaa41dad9af0cccdc1fde2c61e9559cc374a1e5fd85f4a"
1669
  },
1670
  "hf_artifacts_data": {
1671
  "path": "hf_artifacts:data/source_alignment_audit.json",
1672
  "exists": true,
1673
  "bytes": 4432,
1674
+ "sha256": "d51f321ea35f0e57aeaaa41dad9af0cccdc1fde2c61e9559cc374a1e5fd85f4a"
1675
  },
1676
  "hf_artifacts": {
1677
  "path": "hf_artifacts:docs/data/source_alignment_audit.json",
1678
  "exists": true,
1679
  "bytes": 4432,
1680
+ "sha256": "d51f321ea35f0e57aeaaa41dad9af0cccdc1fde2c61e9559cc374a1e5fd85f4a"
1681
  },
1682
  "hf_model_data": {
1683
  "path": "hf_model:data/source_alignment_audit.json",
1684
  "exists": true,
1685
  "bytes": 4432,
1686
+ "sha256": "d51f321ea35f0e57aeaaa41dad9af0cccdc1fde2c61e9559cc374a1e5fd85f4a"
1687
  },
1688
  "hf_model_docs_data": {
1689
  "path": "hf_model:docs/data/source_alignment_audit.json",
1690
  "exists": true,
1691
  "bytes": 4432,
1692
+ "sha256": "d51f321ea35f0e57aeaaa41dad9af0cccdc1fde2c61e9559cc374a1e5fd85f4a"
1693
  },
1694
  "hf_model": {
1695
  "path": "hf_model:metrics/source_alignment_audit.json",
1696
  "exists": true,
1697
  "bytes": 4432,
1698
+ "sha256": "d51f321ea35f0e57aeaaa41dad9af0cccdc1fde2c61e9559cc374a1e5fd85f4a"
1699
  }
1700
  },
1701
  "failures": []
 
1756
  "path": "repo:docs/data/single_episode_task_model_radar.json",
1757
  "exists": true,
1758
  "bytes": 51064,
1759
+ "sha256": "9d42b045d833e50a2bfa8905203150af1f28ea4736d22edb0fe27e39eedf4574"
1760
  },
1761
  "mirrors": {
1762
  "hf_space": {
1763
  "path": "hf_space:data/single_episode_task_model_radar.json",
1764
  "exists": true,
1765
  "bytes": 51064,
1766
+ "sha256": "9d42b045d833e50a2bfa8905203150af1f28ea4736d22edb0fe27e39eedf4574"
1767
  },
1768
  "hf_artifacts_data": {
1769
  "path": "hf_artifacts:data/single_episode_task_model_radar.json",
1770
  "exists": true,
1771
  "bytes": 51064,
1772
+ "sha256": "9d42b045d833e50a2bfa8905203150af1f28ea4736d22edb0fe27e39eedf4574"
1773
  },
1774
  "hf_artifacts": {
1775
  "path": "hf_artifacts:docs/data/single_episode_task_model_radar.json",
1776
  "exists": true,
1777
  "bytes": 51064,
1778
+ "sha256": "9d42b045d833e50a2bfa8905203150af1f28ea4736d22edb0fe27e39eedf4574"
1779
  },
1780
  "hf_model_data": {
1781
  "path": "hf_model:data/single_episode_task_model_radar.json",
1782
  "exists": true,
1783
  "bytes": 51064,
1784
+ "sha256": "9d42b045d833e50a2bfa8905203150af1f28ea4736d22edb0fe27e39eedf4574"
1785
  },
1786
  "hf_model_docs_data": {
1787
  "path": "hf_model:docs/data/single_episode_task_model_radar.json",
1788
  "exists": true,
1789
  "bytes": 51064,
1790
+ "sha256": "9d42b045d833e50a2bfa8905203150af1f28ea4736d22edb0fe27e39eedf4574"
1791
  },
1792
  "hf_model": {
1793
  "path": "hf_model:metrics/single_episode_task_model_radar.json",
1794
  "exists": true,
1795
  "bytes": 51064,
1796
+ "sha256": "9d42b045d833e50a2bfa8905203150af1f28ea4736d22edb0fe27e39eedf4574"
1797
  }
1798
  },
1799
  "failures": []
 
1804
  "local": {
1805
  "path": "repo:docs/data/episode128_task_model_radar.json",
1806
  "exists": true,
1807
+ "bytes": 185314,
1808
+ "sha256": "5c61c8f9a4a9a7b6bdc65e39ef5fda6117df48412afe260c0be4da501bd7e8db"
1809
  },
1810
  "mirrors": {
1811
  "hf_space": {
1812
  "path": "hf_space:data/episode128_task_model_radar.json",
1813
  "exists": true,
1814
+ "bytes": 185314,
1815
+ "sha256": "5c61c8f9a4a9a7b6bdc65e39ef5fda6117df48412afe260c0be4da501bd7e8db"
1816
  },
1817
  "hf_artifacts_data": {
1818
  "path": "hf_artifacts:data/episode128_task_model_radar.json",
1819
  "exists": true,
1820
+ "bytes": 185314,
1821
+ "sha256": "5c61c8f9a4a9a7b6bdc65e39ef5fda6117df48412afe260c0be4da501bd7e8db"
1822
  },
1823
  "hf_artifacts": {
1824
  "path": "hf_artifacts:docs/data/episode128_task_model_radar.json",
1825
  "exists": true,
1826
+ "bytes": 185314,
1827
+ "sha256": "5c61c8f9a4a9a7b6bdc65e39ef5fda6117df48412afe260c0be4da501bd7e8db"
1828
  },
1829
  "hf_model_data": {
1830
  "path": "hf_model:data/episode128_task_model_radar.json",
1831
  "exists": true,
1832
+ "bytes": 185314,
1833
+ "sha256": "5c61c8f9a4a9a7b6bdc65e39ef5fda6117df48412afe260c0be4da501bd7e8db"
1834
  },
1835
  "hf_model_docs_data": {
1836
  "path": "hf_model:docs/data/episode128_task_model_radar.json",
1837
  "exists": true,
1838
+ "bytes": 185314,
1839
+ "sha256": "5c61c8f9a4a9a7b6bdc65e39ef5fda6117df48412afe260c0be4da501bd7e8db"
1840
  },
1841
  "hf_model": {
1842
  "path": "hf_model:metrics/episode128_task_model_radar.json",
1843
  "exists": true,
1844
+ "bytes": 185314,
1845
+ "sha256": "5c61c8f9a4a9a7b6bdc65e39ef5fda6117df48412afe260c0be4da501bd7e8db"
1846
  }
1847
  },
1848
  "failures": []
 
2001
  "path": "repo:docs/data/task_surface_integrity.json",
2002
  "exists": true,
2003
  "bytes": 45779,
2004
+ "sha256": "53473545e9177adee1eb5c4245008c7b101a7b16232dce9dd38e509ae8c867dd"
2005
  },
2006
  "mirrors": {
2007
  "hf_space": {
2008
  "path": "hf_space:data/task_surface_integrity.json",
2009
  "exists": true,
2010
  "bytes": 45779,
2011
+ "sha256": "53473545e9177adee1eb5c4245008c7b101a7b16232dce9dd38e509ae8c867dd"
2012
  },
2013
  "hf_artifacts_data": {
2014
  "path": "hf_artifacts:data/task_surface_integrity.json",
2015
  "exists": true,
2016
  "bytes": 45779,
2017
+ "sha256": "53473545e9177adee1eb5c4245008c7b101a7b16232dce9dd38e509ae8c867dd"
2018
  },
2019
  "hf_artifacts": {
2020
  "path": "hf_artifacts:docs/data/task_surface_integrity.json",
2021
  "exists": true,
2022
  "bytes": 45779,
2023
+ "sha256": "53473545e9177adee1eb5c4245008c7b101a7b16232dce9dd38e509ae8c867dd"
2024
  },
2025
  "hf_model_data": {
2026
  "path": "hf_model:data/task_surface_integrity.json",
2027
  "exists": true,
2028
  "bytes": 45779,
2029
+ "sha256": "53473545e9177adee1eb5c4245008c7b101a7b16232dce9dd38e509ae8c867dd"
2030
  },
2031
  "hf_model_docs_data": {
2032
  "path": "hf_model:docs/data/task_surface_integrity.json",
2033
  "exists": true,
2034
  "bytes": 45779,
2035
+ "sha256": "53473545e9177adee1eb5c4245008c7b101a7b16232dce9dd38e509ae8c867dd"
2036
  },
2037
  "hf_model": {
2038
  "path": "hf_model:metrics/task_surface_integrity.json",
2039
  "exists": true,
2040
  "bytes": 45779,
2041
+ "sha256": "53473545e9177adee1eb5c4245008c7b101a7b16232dce9dd38e509ae8c867dd"
2042
  }
2043
  },
2044
  "failures": []
 
2098
  "local": {
2099
  "path": "repo:docs/data/task_method_20_result_matrix.json",
2100
  "exists": true,
2101
+ "bytes": 128805,
2102
+ "sha256": "d5572768c6fb671eadf87870d20c8645dfae384f862aa63e929b2db50a5cc51a"
2103
  },
2104
  "mirrors": {
2105
  "hf_space": {
2106
  "path": "hf_space:data/task_method_20_result_matrix.json",
2107
  "exists": true,
2108
+ "bytes": 128805,
2109
+ "sha256": "d5572768c6fb671eadf87870d20c8645dfae384f862aa63e929b2db50a5cc51a"
2110
  },
2111
  "hf_artifacts_data": {
2112
  "path": "hf_artifacts:data/task_method_20_result_matrix.json",
2113
  "exists": true,
2114
+ "bytes": 128805,
2115
+ "sha256": "d5572768c6fb671eadf87870d20c8645dfae384f862aa63e929b2db50a5cc51a"
2116
  },
2117
  "hf_artifacts": {
2118
  "path": "hf_artifacts:docs/data/task_method_20_result_matrix.json",
2119
  "exists": true,
2120
+ "bytes": 128805,
2121
+ "sha256": "d5572768c6fb671eadf87870d20c8645dfae384f862aa63e929b2db50a5cc51a"
2122
  },
2123
  "hf_model_data": {
2124
  "path": "hf_model:data/task_method_20_result_matrix.json",
2125
  "exists": true,
2126
+ "bytes": 128805,
2127
+ "sha256": "d5572768c6fb671eadf87870d20c8645dfae384f862aa63e929b2db50a5cc51a"
2128
  },
2129
  "hf_model_docs_data": {
2130
  "path": "hf_model:docs/data/task_method_20_result_matrix.json",
2131
  "exists": true,
2132
+ "bytes": 128805,
2133
+ "sha256": "d5572768c6fb671eadf87870d20c8645dfae384f862aa63e929b2db50a5cc51a"
2134
  },
2135
  "hf_model": {
2136
  "path": "hf_model:metrics/task_method_20_result_matrix.json",
2137
  "exists": true,
2138
+ "bytes": 128805,
2139
+ "sha256": "d5572768c6fb671eadf87870d20c8645dfae384f862aa63e929b2db50a5cc51a"
2140
  }
2141
  },
2142
  "failures": []
 
2147
  "local": {
2148
  "path": "repo:docs/data/task_method_20_gap_audit.json",
2149
  "exists": true,
2150
+ "bytes": 28259,
2151
+ "sha256": "860dea3d3ce2f2c2146c97918a5deca05ae315238b584c10e53f74a9d2c26dcd"
2152
  },
2153
  "mirrors": {
2154
  "hf_space": {
2155
  "path": "hf_space:data/task_method_20_gap_audit.json",
2156
  "exists": true,
2157
+ "bytes": 28259,
2158
+ "sha256": "860dea3d3ce2f2c2146c97918a5deca05ae315238b584c10e53f74a9d2c26dcd"
2159
  },
2160
  "hf_artifacts_data": {
2161
  "path": "hf_artifacts:data/task_method_20_gap_audit.json",
2162
  "exists": true,
2163
+ "bytes": 28259,
2164
+ "sha256": "860dea3d3ce2f2c2146c97918a5deca05ae315238b584c10e53f74a9d2c26dcd"
2165
  },
2166
  "hf_artifacts": {
2167
  "path": "hf_artifacts:docs/data/task_method_20_gap_audit.json",
2168
  "exists": true,
2169
+ "bytes": 28259,
2170
+ "sha256": "860dea3d3ce2f2c2146c97918a5deca05ae315238b584c10e53f74a9d2c26dcd"
2171
  },
2172
  "hf_model_data": {
2173
  "path": "hf_model:data/task_method_20_gap_audit.json",
2174
  "exists": true,
2175
+ "bytes": 28259,
2176
+ "sha256": "860dea3d3ce2f2c2146c97918a5deca05ae315238b584c10e53f74a9d2c26dcd"
2177
  },
2178
  "hf_model_docs_data": {
2179
  "path": "hf_model:docs/data/task_method_20_gap_audit.json",
2180
  "exists": true,
2181
+ "bytes": 28259,
2182
+ "sha256": "860dea3d3ce2f2c2146c97918a5deca05ae315238b584c10e53f74a9d2c26dcd"
2183
  },
2184
  "hf_model": {
2185
  "path": "hf_model:metrics/task_method_20_gap_audit.json",
2186
  "exists": true,
2187
+ "bytes": 28259,
2188
+ "sha256": "860dea3d3ce2f2c2146c97918a5deca05ae315238b584c10e53f74a9d2c26dcd"
2189
  }
2190
  },
2191
  "failures": []
 
2245
  "local": {
2246
  "path": "repo:docs/data/unified_task_model_radar.json",
2247
  "exists": true,
2248
+ "bytes": 229168,
2249
+ "sha256": "64c7c10f3ce663178f2eea4740bb45de0f94b1246448f14f5521d293be916e77"
2250
  },
2251
  "mirrors": {
2252
  "hf_space": {
2253
  "path": "hf_space:data/unified_task_model_radar.json",
2254
  "exists": true,
2255
+ "bytes": 229168,
2256
+ "sha256": "64c7c10f3ce663178f2eea4740bb45de0f94b1246448f14f5521d293be916e77"
2257
  },
2258
  "hf_artifacts_data": {
2259
  "path": "hf_artifacts:data/unified_task_model_radar.json",
2260
  "exists": true,
2261
+ "bytes": 229168,
2262
+ "sha256": "64c7c10f3ce663178f2eea4740bb45de0f94b1246448f14f5521d293be916e77"
2263
  },
2264
  "hf_artifacts": {
2265
  "path": "hf_artifacts:docs/data/unified_task_model_radar.json",
2266
  "exists": true,
2267
+ "bytes": 229168,
2268
+ "sha256": "64c7c10f3ce663178f2eea4740bb45de0f94b1246448f14f5521d293be916e77"
2269
  },
2270
  "hf_model_data": {
2271
  "path": "hf_model:data/unified_task_model_radar.json",
2272
  "exists": true,
2273
+ "bytes": 229168,
2274
+ "sha256": "64c7c10f3ce663178f2eea4740bb45de0f94b1246448f14f5521d293be916e77"
2275
  },
2276
  "hf_model_docs_data": {
2277
  "path": "hf_model:docs/data/unified_task_model_radar.json",
2278
  "exists": true,
2279
+ "bytes": 229168,
2280
+ "sha256": "64c7c10f3ce663178f2eea4740bb45de0f94b1246448f14f5521d293be916e77"
2281
  },
2282
  "hf_model": {
2283
  "path": "hf_model:metrics/unified_task_model_radar.json",
2284
  "exists": true,
2285
+ "bytes": 229168,
2286
+ "sha256": "64c7c10f3ce663178f2eea4740bb45de0f94b1246448f14f5521d293be916e77"
2287
  }
2288
  },
2289
  "failures": []
 
2294
  "local": {
2295
  "path": "repo:docs/data/website_integrity.json",
2296
  "exists": true,
2297
+ "bytes": 20022,
2298
+ "sha256": "4b46dacca993c2a0645cc79518d40b4e57198fe304daa322d0daa5a268043538"
2299
  },
2300
  "mirrors": {
2301
  "hf_space": {
2302
  "path": "hf_space:data/website_integrity.json",
2303
  "exists": true,
2304
+ "bytes": 20022,
2305
+ "sha256": "4b46dacca993c2a0645cc79518d40b4e57198fe304daa322d0daa5a268043538"
2306
  },
2307
  "hf_artifacts_data": {
2308
  "path": "hf_artifacts:data/website_integrity.json",
2309
  "exists": true,
2310
+ "bytes": 20022,
2311
+ "sha256": "4b46dacca993c2a0645cc79518d40b4e57198fe304daa322d0daa5a268043538"
2312
  },
2313
  "hf_artifacts": {
2314
  "path": "hf_artifacts:docs/data/website_integrity.json",
2315
  "exists": true,
2316
+ "bytes": 20022,
2317
+ "sha256": "4b46dacca993c2a0645cc79518d40b4e57198fe304daa322d0daa5a268043538"
2318
  },
2319
  "hf_model_data": {
2320
  "path": "hf_model:data/website_integrity.json",
2321
  "exists": true,
2322
+ "bytes": 20022,
2323
+ "sha256": "4b46dacca993c2a0645cc79518d40b4e57198fe304daa322d0daa5a268043538"
2324
  },
2325
  "hf_model_docs_data": {
2326
  "path": "hf_model:docs/data/website_integrity.json",
2327
  "exists": true,
2328
+ "bytes": 20022,
2329
+ "sha256": "4b46dacca993c2a0645cc79518d40b4e57198fe304daa322d0daa5a268043538"
2330
  },
2331
  "hf_model": {
2332
  "path": "hf_model:metrics/website_integrity.json",
2333
  "exists": true,
2334
+ "bytes": 20022,
2335
+ "sha256": "4b46dacca993c2a0645cc79518d40b4e57198fe304daa322d0daa5a268043538"
2336
  }
2337
  },
2338
  "failures": []
 
2515
  "local": {
2516
  "path": "repo:docs/assets/charts/episode128_task_model_radar.svg",
2517
  "exists": true,
2518
+ "bytes": 48923,
2519
+ "sha256": "75c389122a413548bdc26fd05cbbad2a85015ebd222ba1a23571f3ff4f0eddcf"
2520
  },
2521
  "mirrors": {
2522
  "hf_space": {
2523
  "path": "hf_space:assets/charts/episode128_task_model_radar.svg",
2524
  "exists": true,
2525
+ "bytes": 48923,
2526
+ "sha256": "75c389122a413548bdc26fd05cbbad2a85015ebd222ba1a23571f3ff4f0eddcf"
2527
  },
2528
  "hf_artifacts_docs": {
2529
  "path": "hf_artifacts:docs/assets/charts/episode128_task_model_radar.svg",
2530
  "exists": true,
2531
+ "bytes": 48923,
2532
+ "sha256": "75c389122a413548bdc26fd05cbbad2a85015ebd222ba1a23571f3ff4f0eddcf"
2533
  },
2534
  "hf_artifacts_card": {
2535
  "path": "hf_artifacts:assets/charts/episode128_task_model_radar.svg",
2536
  "exists": true,
2537
+ "bytes": 48923,
2538
+ "sha256": "75c389122a413548bdc26fd05cbbad2a85015ebd222ba1a23571f3ff4f0eddcf"
2539
  },
2540
  "hf_model": {
2541
  "path": "hf_model:assets/charts/episode128_task_model_radar.svg",
2542
  "exists": true,
2543
+ "bytes": 48923,
2544
+ "sha256": "75c389122a413548bdc26fd05cbbad2a85015ebd222ba1a23571f3ff4f0eddcf"
2545
  }
2546
  },
2547
  "failures": []
 
2589
  "local": {
2590
  "path": "repo:docs/assets/charts/unified_task_model_radar.svg",
2591
  "exists": true,
2592
+ "bytes": 54936,
2593
+ "sha256": "f29db4099d60c093ebd092bee37a2fc1338bbff17d7e52b8a1b27ae6fc06727a"
2594
  },
2595
  "mirrors": {
2596
  "hf_space": {
2597
  "path": "hf_space:assets/charts/unified_task_model_radar.svg",
2598
  "exists": true,
2599
+ "bytes": 54936,
2600
+ "sha256": "f29db4099d60c093ebd092bee37a2fc1338bbff17d7e52b8a1b27ae6fc06727a"
2601
  },
2602
  "hf_artifacts_docs": {
2603
  "path": "hf_artifacts:docs/assets/charts/unified_task_model_radar.svg",
2604
  "exists": true,
2605
+ "bytes": 54936,
2606
+ "sha256": "f29db4099d60c093ebd092bee37a2fc1338bbff17d7e52b8a1b27ae6fc06727a"
2607
  },
2608
  "hf_artifacts_card": {
2609
  "path": "hf_artifacts:assets/charts/unified_task_model_radar.svg",
2610
  "exists": true,
2611
+ "bytes": 54936,
2612
+ "sha256": "f29db4099d60c093ebd092bee37a2fc1338bbff17d7e52b8a1b27ae6fc06727a"
2613
  },
2614
  "hf_model": {
2615
  "path": "hf_model:assets/charts/unified_task_model_radar.svg",
2616
  "exists": true,
2617
+ "bytes": 54936,
2618
+ "sha256": "f29db4099d60c093ebd092bee37a2fc1338bbff17d7e52b8a1b27ae6fc06727a"
2619
  }
2620
  },
2621
  "failures": []
 
4509
  "local": {
4510
  "path": "repo:scripts/omni/score_existing_model_output_task_probes.py",
4511
  "exists": true,
4512
+ "bytes": 69411,
4513
+ "sha256": "a78889e5225405fcbb0156aa8c63cbbe79022a12283d0b398c5f2bb015175fe7"
4514
  },
4515
  "mirrors": {
4516
  "hf_artifacts": {
4517
  "path": "hf_artifacts:scripts/omni/score_existing_model_output_task_probes.py",
4518
  "exists": true,
4519
+ "bytes": 69411,
4520
+ "sha256": "a78889e5225405fcbb0156aa8c63cbbe79022a12283d0b398c5f2bb015175fe7"
4521
  },
4522
  "hf_model": {
4523
  "path": "hf_model:scripts/omni/score_existing_model_output_task_probes.py",
4524
  "exists": true,
4525
+ "bytes": 69411,
4526
+ "sha256": "a78889e5225405fcbb0156aa8c63cbbe79022a12283d0b398c5f2bb015175fe7"
4527
  }
4528
  },
4529
  "failures": []
 
5034
  "local": {
5035
  "path": "repo:scripts/build_unified_task_model_radar.py",
5036
  "exists": true,
5037
+ "bytes": 57104,
5038
+ "sha256": "805cfce89529fec73edd3e436c1a76afae46cebe31ba5e441b6dfb5cc142c935"
5039
  },
5040
  "mirrors": {
5041
  "hf_artifacts": {
5042
  "path": "hf_artifacts:scripts/build_unified_task_model_radar.py",
5043
  "exists": true,
5044
+ "bytes": 57104,
5045
+ "sha256": "805cfce89529fec73edd3e436c1a76afae46cebe31ba5e441b6dfb5cc142c935"
5046
  },
5047
  "hf_model": {
5048
  "path": "hf_model:scripts/build_unified_task_model_radar.py",
5049
  "exists": true,
5050
+ "bytes": 57104,
5051
+ "sha256": "805cfce89529fec73edd3e436c1a76afae46cebe31ba5e441b6dfb5cc142c935"
5052
  }
5053
  },
5054
  "failures": []
 
5464
  "path": "repo:docs/index.html",
5465
  "exists": true,
5466
  "bytes": 254770,
5467
+ "sha256": "55fbaf659f3ffe067603938476f895c52782ab8978c701545b6ed53dc23ec8bd"
5468
  },
5469
  "mirrors": {
5470
  "hf_space": {
5471
  "path": "hf_space:index.html",
5472
  "exists": true,
5473
  "bytes": 254770,
5474
+ "sha256": "55fbaf659f3ffe067603938476f895c52782ab8978c701545b6ed53dc23ec8bd"
5475
  },
5476
  "hf_artifacts_root": {
5477
  "path": "hf_artifacts:index.html",
5478
  "exists": true,
5479
  "bytes": 254770,
5480
+ "sha256": "55fbaf659f3ffe067603938476f895c52782ab8978c701545b6ed53dc23ec8bd"
5481
  },
5482
  "hf_artifacts_docs": {
5483
  "path": "hf_artifacts:docs/index.html",
5484
  "exists": true,
5485
  "bytes": 254770,
5486
+ "sha256": "55fbaf659f3ffe067603938476f895c52782ab8978c701545b6ed53dc23ec8bd"
5487
  },
5488
  "hf_model": {
5489
  "path": "hf_model:index.html",
5490
  "exists": true,
5491
  "bytes": 254770,
5492
+ "sha256": "55fbaf659f3ffe067603938476f895c52782ab8978c701545b6ed53dc23ec8bd"
5493
  },
5494
  "hf_model_docs": {
5495
  "path": "hf_model:docs/index.html",
5496
  "exists": true,
5497
  "bytes": 254770,
5498
+ "sha256": "55fbaf659f3ffe067603938476f895c52782ab8978c701545b6ed53dc23ec8bd"
5499
  }
5500
  },
5501
  "failures": []
 
12510
  "local": {
12511
  "path": "repo:results/omni_finetune/model_output_probe_readiness/RUN_REPORT.md",
12512
  "exists": true,
12513
+ "bytes": 1048,
12514
+ "sha256": "5744154e5c35e1c842826ea9bf33a800517e90572a562449e56d638c3211f064"
12515
  },
12516
  "mirrors": {
12517
  "hf_artifacts": {
12518
  "path": "hf_artifacts:results/omni_finetune/model_output_probe_readiness/RUN_REPORT.md",
12519
  "exists": true,
12520
+ "bytes": 1048,
12521
+ "sha256": "5744154e5c35e1c842826ea9bf33a800517e90572a562449e56d638c3211f064"
12522
  },
12523
  "hf_model": {
12524
  "path": "hf_model:results/omni_finetune/model_output_probe_readiness/RUN_REPORT.md",
12525
  "exists": true,
12526
+ "bytes": 1048,
12527
+ "sha256": "5744154e5c35e1c842826ea9bf33a800517e90572a562449e56d638c3211f064"
12528
  }
12529
  },
12530
  "failures": []
 
12535
  "local": {
12536
  "path": "repo:results/omni_finetune/model_output_probe_readiness/model_output_probe_readiness.json",
12537
  "exists": true,
12538
+ "bytes": 4977,
12539
+ "sha256": "b9caf6d32bb801d845b57b4450b92c10a4c3f9d14890f6a209e5a52aede92568"
12540
  },
12541
  "mirrors": {
12542
  "hf_artifacts": {
12543
  "path": "hf_artifacts:results/omni_finetune/model_output_probe_readiness/model_output_probe_readiness.json",
12544
  "exists": true,
12545
+ "bytes": 4977,
12546
+ "sha256": "b9caf6d32bb801d845b57b4450b92c10a4c3f9d14890f6a209e5a52aede92568"
12547
  },
12548
  "hf_model": {
12549
  "path": "hf_model:results/omni_finetune/model_output_probe_readiness/model_output_probe_readiness.json",
12550
  "exists": true,
12551
+ "bytes": 4977,
12552
+ "sha256": "b9caf6d32bb801d845b57b4450b92c10a4c3f9d14890f6a209e5a52aede92568"
12553
  }
12554
  },
12555
  "failures": []
 
12560
  "local": {
12561
  "path": "repo:results/omni_finetune/model_output_task_probes_20260616/RUN_REPORT.md",
12562
  "exists": true,
12563
+ "bytes": 1512,
12564
+ "sha256": "12ea92277ddc22fdd29adc3c7288ca0e0ebec3be3ffdc47f1ff7c4ec075dd015"
12565
  },
12566
  "mirrors": {
12567
  "hf_artifacts": {
12568
  "path": "hf_artifacts:results/omni_finetune/model_output_task_probes_20260616/RUN_REPORT.md",
12569
  "exists": true,
12570
+ "bytes": 1512,
12571
+ "sha256": "12ea92277ddc22fdd29adc3c7288ca0e0ebec3be3ffdc47f1ff7c4ec075dd015"
12572
  },
12573
  "hf_model": {
12574
  "path": "hf_model:results/omni_finetune/model_output_task_probes_20260616/RUN_REPORT.md",
12575
  "exists": true,
12576
+ "bytes": 1512,
12577
+ "sha256": "12ea92277ddc22fdd29adc3c7288ca0e0ebec3be3ffdc47f1ff7c4ec075dd015"
12578
+ }
12579
+ },
12580
+ "failures": []
12581
+ },
12582
+ {
12583
+ "name": "results/omni_finetune/model_output_task_probes_20260616/action_object_relation/cosmos3_nano_future_window/metrics.json",
12584
+ "status": "pass",
12585
+ "local": {
12586
+ "path": "repo:results/omni_finetune/model_output_task_probes_20260616/action_object_relation/cosmos3_nano_future_window/metrics.json",
12587
+ "exists": true,
12588
+ "bytes": 12958,
12589
+ "sha256": "0ea0cacdea44ed714fd47166a999606d76200a30453a39142554cc6bf1b12269"
12590
+ },
12591
+ "mirrors": {
12592
+ "hf_artifacts": {
12593
+ "path": "hf_artifacts:results/omni_finetune/model_output_task_probes_20260616/action_object_relation/cosmos3_nano_future_window/metrics.json",
12594
+ "exists": true,
12595
+ "bytes": 12958,
12596
+ "sha256": "0ea0cacdea44ed714fd47166a999606d76200a30453a39142554cc6bf1b12269"
12597
+ },
12598
+ "hf_model": {
12599
+ "path": "hf_model:results/omni_finetune/model_output_task_probes_20260616/action_object_relation/cosmos3_nano_future_window/metrics.json",
12600
+ "exists": true,
12601
+ "bytes": 12958,
12602
+ "sha256": "0ea0cacdea44ed714fd47166a999606d76200a30453a39142554cc6bf1b12269"
12603
+ }
12604
+ },
12605
+ "failures": []
12606
+ },
12607
+ {
12608
+ "name": "results/omni_finetune/model_output_task_probes_20260616/action_object_relation/cosmos3_nano_future_window/per_class_metrics.csv",
12609
+ "status": "pass",
12610
+ "local": {
12611
+ "path": "repo:results/omni_finetune/model_output_task_probes_20260616/action_object_relation/cosmos3_nano_future_window/per_class_metrics.csv",
12612
+ "exists": true,
12613
+ "bytes": 12133,
12614
+ "sha256": "579c606563073db2ff09a636b294b41aad1ec8d0fa8ae19b8649d3273cf88a51"
12615
+ },
12616
+ "mirrors": {
12617
+ "hf_artifacts": {
12618
+ "path": "hf_artifacts:results/omni_finetune/model_output_task_probes_20260616/action_object_relation/cosmos3_nano_future_window/per_class_metrics.csv",
12619
+ "exists": true,
12620
+ "bytes": 12133,
12621
+ "sha256": "579c606563073db2ff09a636b294b41aad1ec8d0fa8ae19b8649d3273cf88a51"
12622
+ },
12623
+ "hf_model": {
12624
+ "path": "hf_model:results/omni_finetune/model_output_task_probes_20260616/action_object_relation/cosmos3_nano_future_window/per_class_metrics.csv",
12625
+ "exists": true,
12626
+ "bytes": 12133,
12627
+ "sha256": "579c606563073db2ff09a636b294b41aad1ec8d0fa8ae19b8649d3273cf88a51"
12628
+ }
12629
+ },
12630
+ "failures": []
12631
+ },
12632
+ {
12633
+ "name": "results/omni_finetune/model_output_task_probes_20260616/action_object_relation/cosmos3_nano_future_window/predictions.csv",
12634
+ "status": "pass",
12635
+ "local": {
12636
+ "path": "repo:results/omni_finetune/model_output_task_probes_20260616/action_object_relation/cosmos3_nano_future_window/predictions.csv",
12637
+ "exists": true,
12638
+ "bytes": 125863,
12639
+ "sha256": "e8a55a2b42315e2febea992138f9ae31a5543c81219127a25f00f90cdc2440ba"
12640
+ },
12641
+ "mirrors": {
12642
+ "hf_artifacts": {
12643
+ "path": "hf_artifacts:results/omni_finetune/model_output_task_probes_20260616/action_object_relation/cosmos3_nano_future_window/predictions.csv",
12644
+ "exists": true,
12645
+ "bytes": 125863,
12646
+ "sha256": "e8a55a2b42315e2febea992138f9ae31a5543c81219127a25f00f90cdc2440ba"
12647
+ },
12648
+ "hf_model": {
12649
+ "path": "hf_model:results/omni_finetune/model_output_task_probes_20260616/action_object_relation/cosmos3_nano_future_window/predictions.csv",
12650
+ "exists": true,
12651
+ "bytes": 125863,
12652
+ "sha256": "e8a55a2b42315e2febea992138f9ae31a5543c81219127a25f00f90cdc2440ba"
12653
  }
12654
  },
12655
  "failures": []
 
12661
  "path": "repo:results/omni_finetune/model_output_task_probes_20260616/action_object_relation/cosmos3_super_reasoner/metrics.json",
12662
  "exists": true,
12663
  "bytes": 21876,
12664
+ "sha256": "af47c1007e54e06553578a2fee4c9c6a9cbd730bbef0330a32ffd846bb364f14"
12665
  },
12666
  "mirrors": {
12667
  "hf_artifacts": {
12668
  "path": "hf_artifacts:results/omni_finetune/model_output_task_probes_20260616/action_object_relation/cosmos3_super_reasoner/metrics.json",
12669
  "exists": true,
12670
  "bytes": 21876,
12671
+ "sha256": "af47c1007e54e06553578a2fee4c9c6a9cbd730bbef0330a32ffd846bb364f14"
12672
  },
12673
  "hf_model": {
12674
  "path": "hf_model:results/omni_finetune/model_output_task_probes_20260616/action_object_relation/cosmos3_super_reasoner/metrics.json",
12675
  "exists": true,
12676
  "bytes": 21876,
12677
+ "sha256": "af47c1007e54e06553578a2fee4c9c6a9cbd730bbef0330a32ffd846bb364f14"
12678
  }
12679
  },
12680
  "failures": []
 
12736
  "path": "repo:results/omni_finetune/model_output_task_probes_20260616/action_object_relation/qwen3_omni_v6_lora/metrics.json",
12737
  "exists": true,
12738
  "bytes": 169938,
12739
+ "sha256": "d1f1c299960ad62c684fe8b798467b49157b75f6bc89e8a10066cda71b66e305"
12740
  },
12741
  "mirrors": {
12742
  "hf_artifacts": {
12743
  "path": "hf_artifacts:results/omni_finetune/model_output_task_probes_20260616/action_object_relation/qwen3_omni_v6_lora/metrics.json",
12744
  "exists": true,
12745
  "bytes": 169938,
12746
+ "sha256": "d1f1c299960ad62c684fe8b798467b49157b75f6bc89e8a10066cda71b66e305"
12747
  },
12748
  "hf_model": {
12749
  "path": "hf_model:results/omni_finetune/model_output_task_probes_20260616/action_object_relation/qwen3_omni_v6_lora/metrics.json",
12750
  "exists": true,
12751
  "bytes": 169938,
12752
+ "sha256": "d1f1c299960ad62c684fe8b798467b49157b75f6bc89e8a10066cda71b66e305"
12753
  }
12754
  },
12755
  "failures": []
 
12804
  },
12805
  "failures": []
12806
  },
12807
+ {
12808
+ "name": "results/omni_finetune/model_output_task_probes_20260616/caption_grounding/cosmos3_super_reasoner/metrics.json",
12809
+ "status": "pass",
12810
+ "local": {
12811
+ "path": "repo:results/omni_finetune/model_output_task_probes_20260616/caption_grounding/cosmos3_super_reasoner/metrics.json",
12812
+ "exists": true,
12813
+ "bytes": 1738,
12814
+ "sha256": "990efd574e384b785187d442858f17d6da1342ff4ab435ee569e5aa1f6faebc3"
12815
+ },
12816
+ "mirrors": {
12817
+ "hf_artifacts": {
12818
+ "path": "hf_artifacts:results/omni_finetune/model_output_task_probes_20260616/caption_grounding/cosmos3_super_reasoner/metrics.json",
12819
+ "exists": true,
12820
+ "bytes": 1738,
12821
+ "sha256": "990efd574e384b785187d442858f17d6da1342ff4ab435ee569e5aa1f6faebc3"
12822
+ },
12823
+ "hf_model": {
12824
+ "path": "hf_model:results/omni_finetune/model_output_task_probes_20260616/caption_grounding/cosmos3_super_reasoner/metrics.json",
12825
+ "exists": true,
12826
+ "bytes": 1738,
12827
+ "sha256": "990efd574e384b785187d442858f17d6da1342ff4ab435ee569e5aa1f6faebc3"
12828
+ }
12829
+ },
12830
+ "failures": []
12831
+ },
12832
+ {
12833
+ "name": "results/omni_finetune/model_output_task_probes_20260616/caption_grounding/cosmos3_super_reasoner/predictions.csv",
12834
+ "status": "pass",
12835
+ "local": {
12836
+ "path": "repo:results/omni_finetune/model_output_task_probes_20260616/caption_grounding/cosmos3_super_reasoner/predictions.csv",
12837
+ "exists": true,
12838
+ "bytes": 57340,
12839
+ "sha256": "4216a73df04338edf271aaeafe66b041675726d21909e1eb25e7face575c567f"
12840
+ },
12841
+ "mirrors": {
12842
+ "hf_artifacts": {
12843
+ "path": "hf_artifacts:results/omni_finetune/model_output_task_probes_20260616/caption_grounding/cosmos3_super_reasoner/predictions.csv",
12844
+ "exists": true,
12845
+ "bytes": 57340,
12846
+ "sha256": "4216a73df04338edf271aaeafe66b041675726d21909e1eb25e7face575c567f"
12847
+ },
12848
+ "hf_model": {
12849
+ "path": "hf_model:results/omni_finetune/model_output_task_probes_20260616/caption_grounding/cosmos3_super_reasoner/predictions.csv",
12850
+ "exists": true,
12851
+ "bytes": 57340,
12852
+ "sha256": "4216a73df04338edf271aaeafe66b041675726d21909e1eb25e7face575c567f"
12853
+ }
12854
+ },
12855
+ "failures": []
12856
+ },
12857
  {
12858
  "name": "results/omni_finetune/model_output_task_probes_20260616/cosmos3_nano_future_window_source_window_map.jsonl",
12859
  "status": "pass",
 
12911
  "path": "repo:results/omni_finetune/model_output_task_probes_20260616/long_horizon_next_action/cosmos3_nano_future_window/metrics.json",
12912
  "exists": true,
12913
  "bytes": 7404,
12914
+ "sha256": "4d6781bdd3baffdefa929097624be08b8217b3ab03b6f091dd712665a7b3bc21"
12915
  },
12916
  "mirrors": {
12917
  "hf_artifacts": {
12918
  "path": "hf_artifacts:results/omni_finetune/model_output_task_probes_20260616/long_horizon_next_action/cosmos3_nano_future_window/metrics.json",
12919
  "exists": true,
12920
  "bytes": 7404,
12921
+ "sha256": "4d6781bdd3baffdefa929097624be08b8217b3ab03b6f091dd712665a7b3bc21"
12922
  },
12923
  "hf_model": {
12924
  "path": "hf_model:results/omni_finetune/model_output_task_probes_20260616/long_horizon_next_action/cosmos3_nano_future_window/metrics.json",
12925
  "exists": true,
12926
  "bytes": 7404,
12927
+ "sha256": "4d6781bdd3baffdefa929097624be08b8217b3ab03b6f091dd712665a7b3bc21"
12928
  }
12929
  },
12930
  "failures": []
 
12986
  "path": "repo:results/omni_finetune/model_output_task_probes_20260616/long_horizon_next_action/cosmos3_super_reasoner/metrics.json",
12987
  "exists": true,
12988
  "bytes": 10051,
12989
+ "sha256": "19eda7f488885383787498cb081b3e9e6cdd37a64d8f20be1e8f035677e59bea"
12990
  },
12991
  "mirrors": {
12992
  "hf_artifacts": {
12993
  "path": "hf_artifacts:results/omni_finetune/model_output_task_probes_20260616/long_horizon_next_action/cosmos3_super_reasoner/metrics.json",
12994
  "exists": true,
12995
  "bytes": 10051,
12996
+ "sha256": "19eda7f488885383787498cb081b3e9e6cdd37a64d8f20be1e8f035677e59bea"
12997
  },
12998
  "hf_model": {
12999
  "path": "hf_model:results/omni_finetune/model_output_task_probes_20260616/long_horizon_next_action/cosmos3_super_reasoner/metrics.json",
13000
  "exists": true,
13001
  "bytes": 10051,
13002
+ "sha256": "19eda7f488885383787498cb081b3e9e6cdd37a64d8f20be1e8f035677e59bea"
13003
  }
13004
  },
13005
  "failures": []
 
13061
  "path": "repo:results/omni_finetune/model_output_task_probes_20260616/modality_reconstruction/cosmos3_nano_future_window/metrics.json",
13062
  "exists": true,
13063
  "bytes": 1825,
13064
+ "sha256": "12f7b713dd4b203b6d5043e04600a47123a4b098e243388245849f85f9632b47"
13065
  },
13066
  "mirrors": {
13067
  "hf_artifacts": {
13068
  "path": "hf_artifacts:results/omni_finetune/model_output_task_probes_20260616/modality_reconstruction/cosmos3_nano_future_window/metrics.json",
13069
  "exists": true,
13070
  "bytes": 1825,
13071
+ "sha256": "12f7b713dd4b203b6d5043e04600a47123a4b098e243388245849f85f9632b47"
13072
  },
13073
  "hf_model": {
13074
  "path": "hf_model:results/omni_finetune/model_output_task_probes_20260616/modality_reconstruction/cosmos3_nano_future_window/metrics.json",
13075
  "exists": true,
13076
  "bytes": 1825,
13077
+ "sha256": "12f7b713dd4b203b6d5043e04600a47123a4b098e243388245849f85f9632b47"
13078
  }
13079
  },
13080
  "failures": []
 
13086
  "path": "repo:results/omni_finetune/model_output_task_probes_20260616/next_subtask_forecast/cosmos3_nano_future_window/metrics.json",
13087
  "exists": true,
13088
  "bytes": 5594,
13089
+ "sha256": "0d9a271a814c09b0be12effce60b59cb9d67a98fa532dca33a84f1332de362f3"
13090
  },
13091
  "mirrors": {
13092
  "hf_artifacts": {
13093
  "path": "hf_artifacts:results/omni_finetune/model_output_task_probes_20260616/next_subtask_forecast/cosmos3_nano_future_window/metrics.json",
13094
  "exists": true,
13095
  "bytes": 5594,
13096
+ "sha256": "0d9a271a814c09b0be12effce60b59cb9d67a98fa532dca33a84f1332de362f3"
13097
  },
13098
  "hf_model": {
13099
  "path": "hf_model:results/omni_finetune/model_output_task_probes_20260616/next_subtask_forecast/cosmos3_nano_future_window/metrics.json",
13100
  "exists": true,
13101
  "bytes": 5594,
13102
+ "sha256": "0d9a271a814c09b0be12effce60b59cb9d67a98fa532dca33a84f1332de362f3"
13103
  }
13104
  },
13105
  "failures": []
 
13161
  "path": "repo:results/omni_finetune/model_output_task_probes_20260616/object_set_forecast/cosmos3_nano_future_window/metrics.json",
13162
  "exists": true,
13163
  "bytes": 2225,
13164
+ "sha256": "0c2f6c5685c474082d41d1358f277afc04f2a1150b748979e7ac93e06e42b730"
13165
  },
13166
  "mirrors": {
13167
  "hf_artifacts": {
13168
  "path": "hf_artifacts:results/omni_finetune/model_output_task_probes_20260616/object_set_forecast/cosmos3_nano_future_window/metrics.json",
13169
  "exists": true,
13170
  "bytes": 2225,
13171
+ "sha256": "0c2f6c5685c474082d41d1358f277afc04f2a1150b748979e7ac93e06e42b730"
13172
  },
13173
  "hf_model": {
13174
  "path": "hf_model:results/omni_finetune/model_output_task_probes_20260616/object_set_forecast/cosmos3_nano_future_window/metrics.json",
13175
  "exists": true,
13176
  "bytes": 2225,
13177
+ "sha256": "0c2f6c5685c474082d41d1358f277afc04f2a1150b748979e7ac93e06e42b730"
13178
  }
13179
  },
13180
  "failures": []
 
13210
  "local": {
13211
  "path": "repo:results/omni_finetune/model_output_task_probes_20260616/summary.json",
13212
  "exists": true,
13213
+ "bytes": 5951,
13214
+ "sha256": "910477d2fba648605dda128d0ecd2a2c13cfa460573e350dc850014ac91c6c2b"
13215
  },
13216
  "mirrors": {
13217
  "hf_artifacts": {
13218
  "path": "hf_artifacts:results/omni_finetune/model_output_task_probes_20260616/summary.json",
13219
  "exists": true,
13220
+ "bytes": 5951,
13221
+ "sha256": "910477d2fba648605dda128d0ecd2a2c13cfa460573e350dc850014ac91c6c2b"
13222
  },
13223
  "hf_model": {
13224
  "path": "hf_model:results/omni_finetune/model_output_task_probes_20260616/summary.json",
13225
  "exists": true,
13226
+ "bytes": 5951,
13227
+ "sha256": "910477d2fba648605dda128d0ecd2a2c13cfa460573e350dc850014ac91c6c2b"
13228
  }
13229
  },
13230
  "failures": []
 
13236
  "path": "repo:results/omni_finetune/model_output_task_probes_20260616/time_to_transition/cosmos3_nano_future_window/metrics.json",
13237
  "exists": true,
13238
  "bytes": 2398,
13239
+ "sha256": "8fc3464d2183c8e1604b499262327ef315ad0eef0f7c66464fb1229ed23e7a8d"
13240
  },
13241
  "mirrors": {
13242
  "hf_artifacts": {
13243
  "path": "hf_artifacts:results/omni_finetune/model_output_task_probes_20260616/time_to_transition/cosmos3_nano_future_window/metrics.json",
13244
  "exists": true,
13245
  "bytes": 2398,
13246
+ "sha256": "8fc3464d2183c8e1604b499262327ef315ad0eef0f7c66464fb1229ed23e7a8d"
13247
  },
13248
  "hf_model": {
13249
  "path": "hf_model:results/omni_finetune/model_output_task_probes_20260616/time_to_transition/cosmos3_nano_future_window/metrics.json",
13250
  "exists": true,
13251
  "bytes": 2398,
13252
+ "sha256": "8fc3464d2183c8e1604b499262327ef315ad0eef0f7c66464fb1229ed23e7a8d"
13253
  }
13254
  },
13255
  "failures": []
 
13286
  "path": "repo:results/omni_finetune/model_output_task_probes_20260616/time_to_transition/cosmos3_super_reasoner/metrics.json",
13287
  "exists": true,
13288
  "bytes": 2049,
13289
+ "sha256": "0d3b07e5b66015b6f3cfa61e2fddcc669e2397b3659367f58eb0371b7955413d"
13290
  },
13291
  "mirrors": {
13292
  "hf_artifacts": {
13293
  "path": "hf_artifacts:results/omni_finetune/model_output_task_probes_20260616/time_to_transition/cosmos3_super_reasoner/metrics.json",
13294
  "exists": true,
13295
  "bytes": 2049,
13296
+ "sha256": "0d3b07e5b66015b6f3cfa61e2fddcc669e2397b3659367f58eb0371b7955413d"
13297
  },
13298
  "hf_model": {
13299
  "path": "hf_model:results/omni_finetune/model_output_task_probes_20260616/time_to_transition/cosmos3_super_reasoner/metrics.json",
13300
  "exists": true,
13301
  "bytes": 2049,
13302
+ "sha256": "0d3b07e5b66015b6f3cfa61e2fddcc669e2397b3659367f58eb0371b7955413d"
13303
  }
13304
  },
13305
  "failures": []
 
20792
  "local": {
20793
  "path": "repo:results/omni_finetune/model_output_task_probes_20260616/RUN_REPORT.md",
20794
  "exists": true,
20795
+ "bytes": 1512,
20796
+ "sha256": "12ea92277ddc22fdd29adc3c7288ca0e0ebec3be3ffdc47f1ff7c4ec075dd015"
20797
  },
20798
  "mirrors": {
20799
  "hf_space": {
20800
  "path": "hf_space:results/omni_finetune/model_output_task_probes_20260616/RUN_REPORT.md",
20801
  "exists": true,
20802
+ "bytes": 1512,
20803
+ "sha256": "12ea92277ddc22fdd29adc3c7288ca0e0ebec3be3ffdc47f1ff7c4ec075dd015"
20804
+ }
20805
+ },
20806
+ "failures": []
20807
+ },
20808
+ {
20809
+ "name": "space_results/omni_finetune/model_output_task_probes_20260616/action_object_relation/cosmos3_nano_future_window/metrics.json",
20810
+ "status": "pass",
20811
+ "local": {
20812
+ "path": "repo:results/omni_finetune/model_output_task_probes_20260616/action_object_relation/cosmos3_nano_future_window/metrics.json",
20813
+ "exists": true,
20814
+ "bytes": 12958,
20815
+ "sha256": "0ea0cacdea44ed714fd47166a999606d76200a30453a39142554cc6bf1b12269"
20816
+ },
20817
+ "mirrors": {
20818
+ "hf_space": {
20819
+ "path": "hf_space:results/omni_finetune/model_output_task_probes_20260616/action_object_relation/cosmos3_nano_future_window/metrics.json",
20820
+ "exists": true,
20821
+ "bytes": 12958,
20822
+ "sha256": "0ea0cacdea44ed714fd47166a999606d76200a30453a39142554cc6bf1b12269"
20823
+ }
20824
+ },
20825
+ "failures": []
20826
+ },
20827
+ {
20828
+ "name": "space_results/omni_finetune/model_output_task_probes_20260616/action_object_relation/cosmos3_nano_future_window/per_class_metrics.csv",
20829
+ "status": "pass",
20830
+ "local": {
20831
+ "path": "repo:results/omni_finetune/model_output_task_probes_20260616/action_object_relation/cosmos3_nano_future_window/per_class_metrics.csv",
20832
+ "exists": true,
20833
+ "bytes": 12133,
20834
+ "sha256": "579c606563073db2ff09a636b294b41aad1ec8d0fa8ae19b8649d3273cf88a51"
20835
+ },
20836
+ "mirrors": {
20837
+ "hf_space": {
20838
+ "path": "hf_space:results/omni_finetune/model_output_task_probes_20260616/action_object_relation/cosmos3_nano_future_window/per_class_metrics.csv",
20839
+ "exists": true,
20840
+ "bytes": 12133,
20841
+ "sha256": "579c606563073db2ff09a636b294b41aad1ec8d0fa8ae19b8649d3273cf88a51"
20842
+ }
20843
+ },
20844
+ "failures": []
20845
+ },
20846
+ {
20847
+ "name": "space_results/omni_finetune/model_output_task_probes_20260616/action_object_relation/cosmos3_nano_future_window/predictions.csv",
20848
+ "status": "pass",
20849
+ "local": {
20850
+ "path": "repo:results/omni_finetune/model_output_task_probes_20260616/action_object_relation/cosmos3_nano_future_window/predictions.csv",
20851
+ "exists": true,
20852
+ "bytes": 125863,
20853
+ "sha256": "e8a55a2b42315e2febea992138f9ae31a5543c81219127a25f00f90cdc2440ba"
20854
+ },
20855
+ "mirrors": {
20856
+ "hf_space": {
20857
+ "path": "hf_space:results/omni_finetune/model_output_task_probes_20260616/action_object_relation/cosmos3_nano_future_window/predictions.csv",
20858
+ "exists": true,
20859
+ "bytes": 125863,
20860
+ "sha256": "e8a55a2b42315e2febea992138f9ae31a5543c81219127a25f00f90cdc2440ba"
20861
  }
20862
  },
20863
  "failures": []
 
20869
  "path": "repo:results/omni_finetune/model_output_task_probes_20260616/action_object_relation/cosmos3_super_reasoner/metrics.json",
20870
  "exists": true,
20871
  "bytes": 21876,
20872
+ "sha256": "af47c1007e54e06553578a2fee4c9c6a9cbd730bbef0330a32ffd846bb364f14"
20873
  },
20874
  "mirrors": {
20875
  "hf_space": {
20876
  "path": "hf_space:results/omni_finetune/model_output_task_probes_20260616/action_object_relation/cosmos3_super_reasoner/metrics.json",
20877
  "exists": true,
20878
  "bytes": 21876,
20879
+ "sha256": "af47c1007e54e06553578a2fee4c9c6a9cbd730bbef0330a32ffd846bb364f14"
20880
  }
20881
  },
20882
  "failures": []
 
20926
  "path": "repo:results/omni_finetune/model_output_task_probes_20260616/action_object_relation/qwen3_omni_v6_lora/metrics.json",
20927
  "exists": true,
20928
  "bytes": 169938,
20929
+ "sha256": "d1f1c299960ad62c684fe8b798467b49157b75f6bc89e8a10066cda71b66e305"
20930
  },
20931
  "mirrors": {
20932
  "hf_space": {
20933
  "path": "hf_space:results/omni_finetune/model_output_task_probes_20260616/action_object_relation/qwen3_omni_v6_lora/metrics.json",
20934
  "exists": true,
20935
  "bytes": 169938,
20936
+ "sha256": "d1f1c299960ad62c684fe8b798467b49157b75f6bc89e8a10066cda71b66e305"
20937
  }
20938
  },
20939
  "failures": []
 
20976
  },
20977
  "failures": []
20978
  },
20979
+ {
20980
+ "name": "space_results/omni_finetune/model_output_task_probes_20260616/caption_grounding/cosmos3_super_reasoner/metrics.json",
20981
+ "status": "pass",
20982
+ "local": {
20983
+ "path": "repo:results/omni_finetune/model_output_task_probes_20260616/caption_grounding/cosmos3_super_reasoner/metrics.json",
20984
+ "exists": true,
20985
+ "bytes": 1738,
20986
+ "sha256": "990efd574e384b785187d442858f17d6da1342ff4ab435ee569e5aa1f6faebc3"
20987
+ },
20988
+ "mirrors": {
20989
+ "hf_space": {
20990
+ "path": "hf_space:results/omni_finetune/model_output_task_probes_20260616/caption_grounding/cosmos3_super_reasoner/metrics.json",
20991
+ "exists": true,
20992
+ "bytes": 1738,
20993
+ "sha256": "990efd574e384b785187d442858f17d6da1342ff4ab435ee569e5aa1f6faebc3"
20994
+ }
20995
+ },
20996
+ "failures": []
20997
+ },
20998
+ {
20999
+ "name": "space_results/omni_finetune/model_output_task_probes_20260616/caption_grounding/cosmos3_super_reasoner/predictions.csv",
21000
+ "status": "pass",
21001
+ "local": {
21002
+ "path": "repo:results/omni_finetune/model_output_task_probes_20260616/caption_grounding/cosmos3_super_reasoner/predictions.csv",
21003
+ "exists": true,
21004
+ "bytes": 57340,
21005
+ "sha256": "4216a73df04338edf271aaeafe66b041675726d21909e1eb25e7face575c567f"
21006
+ },
21007
+ "mirrors": {
21008
+ "hf_space": {
21009
+ "path": "hf_space:results/omni_finetune/model_output_task_probes_20260616/caption_grounding/cosmos3_super_reasoner/predictions.csv",
21010
+ "exists": true,
21011
+ "bytes": 57340,
21012
+ "sha256": "4216a73df04338edf271aaeafe66b041675726d21909e1eb25e7face575c567f"
21013
+ }
21014
+ },
21015
+ "failures": []
21016
+ },
21017
  {
21018
  "name": "space_results/omni_finetune/model_output_task_probes_20260616/cosmos3_nano_future_window_source_window_map.jsonl",
21019
  "status": "pass",
 
21059
  "path": "repo:results/omni_finetune/model_output_task_probes_20260616/long_horizon_next_action/cosmos3_nano_future_window/metrics.json",
21060
  "exists": true,
21061
  "bytes": 7404,
21062
+ "sha256": "4d6781bdd3baffdefa929097624be08b8217b3ab03b6f091dd712665a7b3bc21"
21063
  },
21064
  "mirrors": {
21065
  "hf_space": {
21066
  "path": "hf_space:results/omni_finetune/model_output_task_probes_20260616/long_horizon_next_action/cosmos3_nano_future_window/metrics.json",
21067
  "exists": true,
21068
  "bytes": 7404,
21069
+ "sha256": "4d6781bdd3baffdefa929097624be08b8217b3ab03b6f091dd712665a7b3bc21"
21070
  }
21071
  },
21072
  "failures": []
 
21116
  "path": "repo:results/omni_finetune/model_output_task_probes_20260616/long_horizon_next_action/cosmos3_super_reasoner/metrics.json",
21117
  "exists": true,
21118
  "bytes": 10051,
21119
+ "sha256": "19eda7f488885383787498cb081b3e9e6cdd37a64d8f20be1e8f035677e59bea"
21120
  },
21121
  "mirrors": {
21122
  "hf_space": {
21123
  "path": "hf_space:results/omni_finetune/model_output_task_probes_20260616/long_horizon_next_action/cosmos3_super_reasoner/metrics.json",
21124
  "exists": true,
21125
  "bytes": 10051,
21126
+ "sha256": "19eda7f488885383787498cb081b3e9e6cdd37a64d8f20be1e8f035677e59bea"
21127
  }
21128
  },
21129
  "failures": []
 
21173
  "path": "repo:results/omni_finetune/model_output_task_probes_20260616/modality_reconstruction/cosmos3_nano_future_window/metrics.json",
21174
  "exists": true,
21175
  "bytes": 1825,
21176
+ "sha256": "12f7b713dd4b203b6d5043e04600a47123a4b098e243388245849f85f9632b47"
21177
  },
21178
  "mirrors": {
21179
  "hf_space": {
21180
  "path": "hf_space:results/omni_finetune/model_output_task_probes_20260616/modality_reconstruction/cosmos3_nano_future_window/metrics.json",
21181
  "exists": true,
21182
  "bytes": 1825,
21183
+ "sha256": "12f7b713dd4b203b6d5043e04600a47123a4b098e243388245849f85f9632b47"
21184
  }
21185
  },
21186
  "failures": []
 
21192
  "path": "repo:results/omni_finetune/model_output_task_probes_20260616/next_subtask_forecast/cosmos3_nano_future_window/metrics.json",
21193
  "exists": true,
21194
  "bytes": 5594,
21195
+ "sha256": "0d9a271a814c09b0be12effce60b59cb9d67a98fa532dca33a84f1332de362f3"
21196
  },
21197
  "mirrors": {
21198
  "hf_space": {
21199
  "path": "hf_space:results/omni_finetune/model_output_task_probes_20260616/next_subtask_forecast/cosmos3_nano_future_window/metrics.json",
21200
  "exists": true,
21201
  "bytes": 5594,
21202
+ "sha256": "0d9a271a814c09b0be12effce60b59cb9d67a98fa532dca33a84f1332de362f3"
21203
  }
21204
  },
21205
  "failures": []
 
21249
  "path": "repo:results/omni_finetune/model_output_task_probes_20260616/object_set_forecast/cosmos3_nano_future_window/metrics.json",
21250
  "exists": true,
21251
  "bytes": 2225,
21252
+ "sha256": "0c2f6c5685c474082d41d1358f277afc04f2a1150b748979e7ac93e06e42b730"
21253
  },
21254
  "mirrors": {
21255
  "hf_space": {
21256
  "path": "hf_space:results/omni_finetune/model_output_task_probes_20260616/object_set_forecast/cosmos3_nano_future_window/metrics.json",
21257
  "exists": true,
21258
  "bytes": 2225,
21259
+ "sha256": "0c2f6c5685c474082d41d1358f277afc04f2a1150b748979e7ac93e06e42b730"
21260
  }
21261
  },
21262
  "failures": []
 
21286
  "local": {
21287
  "path": "repo:results/omni_finetune/model_output_task_probes_20260616/summary.json",
21288
  "exists": true,
21289
+ "bytes": 5951,
21290
+ "sha256": "910477d2fba648605dda128d0ecd2a2c13cfa460573e350dc850014ac91c6c2b"
21291
  },
21292
  "mirrors": {
21293
  "hf_space": {
21294
  "path": "hf_space:results/omni_finetune/model_output_task_probes_20260616/summary.json",
21295
  "exists": true,
21296
+ "bytes": 5951,
21297
+ "sha256": "910477d2fba648605dda128d0ecd2a2c13cfa460573e350dc850014ac91c6c2b"
21298
  }
21299
  },
21300
  "failures": []
 
21306
  "path": "repo:results/omni_finetune/model_output_task_probes_20260616/time_to_transition/cosmos3_nano_future_window/metrics.json",
21307
  "exists": true,
21308
  "bytes": 2398,
21309
+ "sha256": "8fc3464d2183c8e1604b499262327ef315ad0eef0f7c66464fb1229ed23e7a8d"
21310
  },
21311
  "mirrors": {
21312
  "hf_space": {
21313
  "path": "hf_space:results/omni_finetune/model_output_task_probes_20260616/time_to_transition/cosmos3_nano_future_window/metrics.json",
21314
  "exists": true,
21315
  "bytes": 2398,
21316
+ "sha256": "8fc3464d2183c8e1604b499262327ef315ad0eef0f7c66464fb1229ed23e7a8d"
21317
  }
21318
  },
21319
  "failures": []
 
21344
  "path": "repo:results/omni_finetune/model_output_task_probes_20260616/time_to_transition/cosmos3_super_reasoner/metrics.json",
21345
  "exists": true,
21346
  "bytes": 2049,
21347
+ "sha256": "0d3b07e5b66015b6f3cfa61e2fddcc669e2397b3659367f58eb0371b7955413d"
21348
  },
21349
  "mirrors": {
21350
  "hf_space": {
21351
  "path": "hf_space:results/omni_finetune/model_output_task_probes_20260616/time_to_transition/cosmos3_super_reasoner/metrics.json",
21352
  "exists": true,
21353
  "bytes": 2049,
21354
+ "sha256": "0d3b07e5b66015b6f3cfa61e2fddcc669e2397b3659367f58eb0371b7955413d"
21355
  }
21356
  },
21357
  "failures": []
 
22930
  "local": {
22931
  "path": "repo:TASK_METHOD_20_GAP_AUDIT.md",
22932
  "exists": true,
22933
+ "bytes": 8428,
22934
+ "sha256": "b33c7f91565a2603b138eb4ec1c6df32d823225b16563eba279f416b0fe2a964"
22935
  },
22936
  "mirrors": {
22937
  "hf_space": {
22938
  "path": "hf_space:TASK_METHOD_20_GAP_AUDIT.md",
22939
  "exists": true,
22940
+ "bytes": 8428,
22941
+ "sha256": "b33c7f91565a2603b138eb4ec1c6df32d823225b16563eba279f416b0fe2a964"
22942
  },
22943
  "hf_artifacts": {
22944
  "path": "hf_artifacts:TASK_METHOD_20_GAP_AUDIT.md",
22945
  "exists": true,
22946
+ "bytes": 8428,
22947
+ "sha256": "b33c7f91565a2603b138eb4ec1c6df32d823225b16563eba279f416b0fe2a964"
22948
  },
22949
  "hf_model": {
22950
  "path": "hf_model:TASK_METHOD_20_GAP_AUDIT.md",
22951
  "exists": true,
22952
+ "bytes": 8428,
22953
+ "sha256": "b33c7f91565a2603b138eb4ec1c6df32d823225b16563eba279f416b0fe2a964"
22954
  }
22955
  },
22956
  "failures": []
 
22961
  "local": {
22962
  "path": "repo:TASK_METHOD_20_RESULT_MATRIX.md",
22963
  "exists": true,
22964
+ "bytes": 3876,
22965
+ "sha256": "a9ce23a452ca73b6d08219ffaac1782d5baad11f9e3662138b62cb4cd5ff206f"
22966
  },
22967
  "mirrors": {
22968
  "hf_space": {
22969
  "path": "hf_space:TASK_METHOD_20_RESULT_MATRIX.md",
22970
  "exists": true,
22971
+ "bytes": 3876,
22972
+ "sha256": "a9ce23a452ca73b6d08219ffaac1782d5baad11f9e3662138b62cb4cd5ff206f"
22973
  },
22974
  "hf_artifacts": {
22975
  "path": "hf_artifacts:TASK_METHOD_20_RESULT_MATRIX.md",
22976
  "exists": true,
22977
+ "bytes": 3876,
22978
+ "sha256": "a9ce23a452ca73b6d08219ffaac1782d5baad11f9e3662138b62cb4cd5ff206f"
22979
  },
22980
  "hf_model": {
22981
  "path": "hf_model:TASK_METHOD_20_RESULT_MATRIX.md",
22982
  "exists": true,
22983
+ "bytes": 3876,
22984
+ "sha256": "a9ce23a452ca73b6d08219ffaac1782d5baad11f9e3662138b62cb4cd5ff206f"
22985
  }
22986
  },
22987
  "failures": []
data/public_surface_qa.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "title": "Ropedia Xperience-10M Public Project Surface",
3
  "status": "pass",
4
- "generated_at_utc": "2026-06-18T22:26:00+00:00",
5
  "scope": "Repo README, GitHub Pages HTML, Hugging Face Space card, artifact dataset card, and model card.",
6
  "checks": [
7
  {
@@ -18,7 +18,7 @@
18
  "website_integrity": {
19
  "exists": true,
20
  "status": "pass",
21
- "generated_at_utc": "2026-06-18T21:01:47+00:00"
22
  },
23
  "rendered_site_check": {
24
  "exists": true,
@@ -28,27 +28,27 @@
28
  "task_surface_integrity": {
29
  "exists": true,
30
  "status": "pass",
31
- "generated_at_utc": "2026-06-18T21:01:45+00:00"
32
  },
33
  "source_alignment": {
34
  "exists": true,
35
  "status": "pass",
36
- "generated_at_utc": "2026-06-18T21:01:45+00:00"
37
  },
38
  "scale_up_status": {
39
  "exists": true,
40
  "status": "pass",
41
- "generated_at_utc": "2026-06-18T21:01:43+00:00"
42
  },
43
  "publication_package": {
44
  "exists": true,
45
  "status": "pass",
46
- "generated_at_utc": "2026-06-18T21:02:20+00:00"
47
  },
48
  "mirror_parity": {
49
  "exists": true,
50
  "status": "pass",
51
- "generated_at_utc": "2026-06-18T21:03:15+00:00"
52
  }
53
  },
54
  "failures": {}
 
1
  {
2
  "title": "Ropedia Xperience-10M Public Project Surface",
3
  "status": "pass",
4
+ "generated_at_utc": "2026-06-18T22:57:13+00:00",
5
  "scope": "Repo README, GitHub Pages HTML, Hugging Face Space card, artifact dataset card, and model card.",
6
  "checks": [
7
  {
 
18
  "website_integrity": {
19
  "exists": true,
20
  "status": "pass",
21
+ "generated_at_utc": "2026-06-18T22:27:45+00:00"
22
  },
23
  "rendered_site_check": {
24
  "exists": true,
 
28
  "task_surface_integrity": {
29
  "exists": true,
30
  "status": "pass",
31
+ "generated_at_utc": "2026-06-18T22:27:40+00:00"
32
  },
33
  "source_alignment": {
34
  "exists": true,
35
  "status": "pass",
36
+ "generated_at_utc": "2026-06-18T22:27:40+00:00"
37
  },
38
  "scale_up_status": {
39
  "exists": true,
40
  "status": "pass",
41
+ "generated_at_utc": "2026-06-18T22:27:40+00:00"
42
  },
43
  "publication_package": {
44
  "exists": true,
45
  "status": "pass",
46
+ "generated_at_utc": "2026-06-18T22:27:55+00:00"
47
  },
48
  "mirror_parity": {
49
  "exists": true,
50
  "status": "pass",
51
+ "generated_at_utc": "2026-06-18T22:36:57+00:00"
52
  }
53
  },
54
  "failures": {}
data/quality_gates.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "title": "Ropedia Xperience-10M Release Checks",
3
  "status": "pass",
4
- "generated_at_utc": "2026-06-18T22:26:00+00:00",
5
  "rule": "A release is current when the automated reports pass and the live GitHub/Hugging Face mirrors are verified after publishing.",
6
  "automated_gates": [
7
  {
 
1
  {
2
  "title": "Ropedia Xperience-10M Release Checks",
3
  "status": "pass",
4
+ "generated_at_utc": "2026-06-18T22:57:13+00:00",
5
  "rule": "A release is current when the automated reports pass and the live GitHub/Hugging Face mirrors are verified after publishing.",
6
  "automated_gates": [
7
  {
data/single_episode_task_model_radar.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "title": "Single-Episode 20-Task Radar",
3
  "status": "pass",
4
- "generated_at_utc": "2026-06-18T22:25:59+00:00",
5
  "description": "Minimal and Neural MLP baselines on the one public sample episode, both scored on all 20 task contracts.",
6
  "task_count": 20,
7
  "method_count": 2,
 
1
  {
2
  "title": "Single-Episode 20-Task Radar",
3
  "status": "pass",
4
+ "generated_at_utc": "2026-06-18T22:55:01+00:00",
5
  "description": "Minimal and Neural MLP baselines on the one public sample episode, both scored on all 20 task contracts.",
6
  "task_count": 20,
7
  "method_count": 2,
data/source_alignment_audit.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "title": "Ropedia Xperience-10M Source Alignment Note",
3
  "status": "pass",
4
- "generated_at_utc": "2026-06-18T22:27:40+00:00",
5
  "alignment_json": "docs/data/xperience10m_dataset_card_alignment.json",
6
  "alignment_summary": {
7
  "full_dataset_repo": "ropedia-ai/xperience-10m",
 
1
  {
2
  "title": "Ropedia Xperience-10M Source Alignment Note",
3
  "status": "pass",
4
+ "generated_at_utc": "2026-06-18T22:57:59+00:00",
5
  "alignment_json": "docs/data/xperience10m_dataset_card_alignment.json",
6
  "alignment_summary": {
7
  "full_dataset_repo": "ropedia-ai/xperience-10m",
data/task_method_20_gap_audit.json CHANGED
@@ -1,10 +1,10 @@
1
  {
2
- "generated_at_utc": "2026-06-18T22:25:59+00:00",
3
  "immediate_actions": [
4
  {
5
  "artifact": "docs/data/task_method_20_gap_audit.json",
6
  "id": "gap_audit",
7
- "purpose": "Keep the 29 scoreless cells visible and reproducible."
8
  },
9
  {
10
  "artifact": "scripts/omni/score_model_output_probes.py",
@@ -24,11 +24,11 @@
24
  "proxy_scored_task_count": 0,
25
  "result_record_count": 20,
26
  "scope": "128 selected episodes, held-out test",
27
- "scored_task_count": 10,
28
- "scoreless_task_count": 10,
29
  "status_counts": {
30
- "not_evaluated_in_verified_package": 10,
31
- "scored": 10
32
  }
33
  },
34
  "cosmos3_super_reasoner": {
@@ -37,11 +37,11 @@
37
  "proxy_scored_task_count": 0,
38
  "result_record_count": 20,
39
  "scope": "128 selected episodes, held-out test",
40
- "scored_task_count": 9,
41
- "scoreless_task_count": 11,
42
  "status_counts": {
43
- "not_evaluated_in_verified_package": 11,
44
- "scored": 9
45
  }
46
  },
47
  "metadata128_neural_mlp": {
@@ -135,14 +135,14 @@
135
  }
136
  },
137
  "missing_by_method": {
138
- "cosmos3_nano_future_window": 10,
139
- "cosmos3_super_reasoner": 11,
140
  "metadata128_neural_mlp": 2,
141
  "metadata128_simple": 2,
142
  "qwen3_omni_v6_lora": 4
143
  },
144
  "missing_by_status": {
145
- "not_evaluated_in_verified_package": 25,
146
  "not_supported_by_metadata_only_package": 2,
147
  "unsupported_without_required_target": 2
148
  },
@@ -159,8 +159,7 @@
159
  "cosmos3_nano_future_window"
160
  ],
161
  "08 Language Grounding": [
162
- "cosmos3_nano_future_window",
163
- "cosmos3_super_reasoner"
164
  ],
165
  "09 Cross-Modal Retrieval": [
166
  "cosmos3_super_reasoner"
@@ -187,9 +186,6 @@
187
  "metadata128_simple",
188
  "qwen3_omni_v6_lora"
189
  ],
190
- "16 Action-Object Relation Prediction": [
191
- "cosmos3_nano_future_window"
192
- ],
193
  "17 Future Object-Set Forecasting": [
194
  "cosmos3_super_reasoner"
195
  ],
@@ -271,19 +267,6 @@
271
  "task_label": "Object Relevance Prediction",
272
  "task_number": 7
273
  },
274
- {
275
- "method": "Cosmos3-Super Reasoner",
276
- "metric_key": "mrr",
277
- "reason": "the verified public model package did not ask this branch to emit that task target; a new task-specific evaluation package is required for a numeric score",
278
- "recommended_next_step": "Generate verified model outputs for this task contract and score them against the held-out labels.",
279
- "scope": "multi_episode_128_partial_model_overlay",
280
- "series_id": "cosmos3_super_reasoner",
281
- "status": "not_evaluated_in_verified_package",
282
- "status_label": "not evaluated",
283
- "task_id": "caption_grounding",
284
- "task_label": "Language Grounding",
285
- "task_number": 8
286
- },
287
  {
288
  "method": "Cosmos3-Nano Future Window",
289
  "metric_key": "mrr",
@@ -466,19 +449,6 @@
466
  "task_label": "Interaction Text Prediction",
467
  "task_number": 15
468
  },
469
- {
470
- "method": "Cosmos3-Nano Future Window",
471
- "metric_key": "macro_f1",
472
- "reason": "the verified public model package did not ask this branch to emit that task target; a new task-specific evaluation package is required for a numeric score",
473
- "recommended_next_step": "Generate verified model outputs for this task contract and score them against the held-out labels.",
474
- "scope": "multi_episode_128_partial_model_overlay",
475
- "series_id": "cosmos3_nano_future_window",
476
- "status": "not_evaluated_in_verified_package",
477
- "status_label": "not evaluated",
478
- "task_id": "action_object_relation",
479
- "task_label": "Action-Object Relation Prediction",
480
- "task_number": 16
481
- },
482
  {
483
  "method": "Cosmos3-Super Reasoner",
484
  "metric_key": "micro_f1",
@@ -630,8 +600,8 @@
630
  "method_count": 9,
631
  "method_task_record_count": 180,
632
  "proxy_scored_method_task_count": 4,
633
- "scored_method_task_count": 151,
634
- "scoreless_method_task_count": 29,
635
  "task_count": 20
636
  },
637
  "source_matrix": "docs/data/task_method_20_result_matrix.json",
 
1
  {
2
+ "generated_at_utc": "2026-06-18T22:55:35+00:00",
3
  "immediate_actions": [
4
  {
5
  "artifact": "docs/data/task_method_20_gap_audit.json",
6
  "id": "gap_audit",
7
+ "purpose": "Keep the 27 scoreless cells visible and reproducible."
8
  },
9
  {
10
  "artifact": "scripts/omni/score_model_output_probes.py",
 
24
  "proxy_scored_task_count": 0,
25
  "result_record_count": 20,
26
  "scope": "128 selected episodes, held-out test",
27
+ "scored_task_count": 11,
28
+ "scoreless_task_count": 9,
29
  "status_counts": {
30
+ "not_evaluated_in_verified_package": 9,
31
+ "scored": 11
32
  }
33
  },
34
  "cosmos3_super_reasoner": {
 
37
  "proxy_scored_task_count": 0,
38
  "result_record_count": 20,
39
  "scope": "128 selected episodes, held-out test",
40
+ "scored_task_count": 10,
41
+ "scoreless_task_count": 10,
42
  "status_counts": {
43
+ "not_evaluated_in_verified_package": 10,
44
+ "scored": 10
45
  }
46
  },
47
  "metadata128_neural_mlp": {
 
135
  }
136
  },
137
  "missing_by_method": {
138
+ "cosmos3_nano_future_window": 9,
139
+ "cosmos3_super_reasoner": 10,
140
  "metadata128_neural_mlp": 2,
141
  "metadata128_simple": 2,
142
  "qwen3_omni_v6_lora": 4
143
  },
144
  "missing_by_status": {
145
+ "not_evaluated_in_verified_package": 23,
146
  "not_supported_by_metadata_only_package": 2,
147
  "unsupported_without_required_target": 2
148
  },
 
159
  "cosmos3_nano_future_window"
160
  ],
161
  "08 Language Grounding": [
162
+ "cosmos3_nano_future_window"
 
163
  ],
164
  "09 Cross-Modal Retrieval": [
165
  "cosmos3_super_reasoner"
 
186
  "metadata128_simple",
187
  "qwen3_omni_v6_lora"
188
  ],
 
 
 
189
  "17 Future Object-Set Forecasting": [
190
  "cosmos3_super_reasoner"
191
  ],
 
267
  "task_label": "Object Relevance Prediction",
268
  "task_number": 7
269
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
270
  {
271
  "method": "Cosmos3-Nano Future Window",
272
  "metric_key": "mrr",
 
449
  "task_label": "Interaction Text Prediction",
450
  "task_number": 15
451
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
452
  {
453
  "method": "Cosmos3-Super Reasoner",
454
  "metric_key": "micro_f1",
 
600
  "method_count": 9,
601
  "method_task_record_count": 180,
602
  "proxy_scored_method_task_count": 4,
603
+ "scored_method_task_count": 153,
604
+ "scoreless_method_task_count": 27,
605
  "task_count": 20
606
  },
607
  "source_matrix": "docs/data/task_method_20_result_matrix.json",
data/task_method_20_result_matrix.json CHANGED
@@ -1,11 +1,11 @@
1
  {
2
  "title": "Task Method 20-Result Matrix",
3
  "status": "pass",
4
- "generated_at_utc": "2026-06-18T22:25:59+00:00",
5
  "task_count": 20,
6
  "method_count": 9,
7
  "method_task_record_count": 180,
8
- "scored_method_task_count": 151,
9
  "series": [
10
  {
11
  "id": "minimal",
@@ -181,20 +181,20 @@
181
  "kind": "partial_128_episode_foundation_model_overlay",
182
  "scope": "128 selected episodes, held-out test",
183
  "stroke_dasharray": "4 7",
184
- "method_detail": "Verified Cosmos3-Super base-weight Reasoner JSON-task evaluation, plus task 16 and a derived task-20 action-boundary timing probe scored from existing verified JSON.",
185
  "plotted_as": "colored point overlay",
186
  "result_record_count": 20,
187
- "scored_task_count": 9,
188
- "covered_task_count": 9,
189
  "proxy_scored_task_count": 0,
190
- "scoreless_task_count": 11,
191
  "unsupported_task_count": 0,
192
- "not_evaluated_task_count": 11,
193
  "status_counts": {
194
- "not_evaluated_in_verified_package": 11,
195
- "scored": 9
196
  },
197
- "coverage_fraction": 0.45,
198
  "result_record_fraction": 1.0
199
  },
200
  {
@@ -205,20 +205,20 @@
205
  "kind": "partial_128_episode_world_model_overlay",
206
  "scope": "128 selected episodes, held-out test",
207
  "stroke_dasharray": "2 7",
208
- "method_detail": "Verified Cosmos3-Nano future-window compatibility metrics, plus tasks 10/13/14/17 and a derived task-20 boundary timing probe scored from existing held-out future-window artifacts.",
209
  "plotted_as": "colored point overlay",
210
  "result_record_count": 20,
211
- "scored_task_count": 10,
212
- "covered_task_count": 10,
213
  "proxy_scored_task_count": 0,
214
- "scoreless_task_count": 10,
215
  "unsupported_task_count": 0,
216
- "not_evaluated_task_count": 10,
217
  "status_counts": {
218
- "not_evaluated_in_verified_package": 10,
219
- "scored": 10
220
  },
221
- "coverage_fraction": 0.5,
222
  "result_record_fraction": 1.0
223
  }
224
  ],
@@ -1489,17 +1489,17 @@
1489
  "task_label": "Language Grounding",
1490
  "series_id": "cosmos3_super_reasoner",
1491
  "method": "Cosmos3-Super Reasoner",
1492
- "status": "not_evaluated_in_verified_package",
1493
- "status_label": "not evaluated",
1494
- "scored": false,
1495
  "proxy_scored": false,
1496
- "raw": null,
1497
- "raw_text": "n/a",
1498
- "normalized_score": null,
1499
- "metric_key": "mrr",
1500
- "source": null,
1501
  "scope": "multi_episode_128_partial_model_overlay",
1502
- "reason": "the verified public model package did not ask this branch to emit that task target; a new task-specific evaluation package is required for a numeric score"
1503
  },
1504
  {
1505
  "task_number": 8,
@@ -2803,17 +2803,17 @@
2803
  "task_label": "Action-Object Relation Prediction",
2804
  "series_id": "cosmos3_nano_future_window",
2805
  "method": "Cosmos3-Nano Future Window",
2806
- "status": "not_evaluated_in_verified_package",
2807
- "status_label": "not evaluated",
2808
- "scored": false,
2809
  "proxy_scored": false,
2810
- "raw": null,
2811
- "raw_text": "n/a",
2812
- "normalized_score": null,
2813
- "metric_key": "macro_f1",
2814
- "source": null,
2815
  "scope": "multi_episode_128_partial_model_overlay",
2816
- "reason": "the verified public model package did not ask this branch to emit that task target; a new task-specific evaluation package is required for a numeric score"
2817
  },
2818
  {
2819
  "task_number": 17,
 
1
  {
2
  "title": "Task Method 20-Result Matrix",
3
  "status": "pass",
4
+ "generated_at_utc": "2026-06-18T22:55:01+00:00",
5
  "task_count": 20,
6
  "method_count": 9,
7
  "method_task_record_count": 180,
8
+ "scored_method_task_count": 153,
9
  "series": [
10
  {
11
  "id": "minimal",
 
181
  "kind": "partial_128_episode_foundation_model_overlay",
182
  "scope": "128 selected episodes, held-out test",
183
  "stroke_dasharray": "4 7",
184
+ "method_detail": "Verified Cosmos3-Super base-weight Reasoner JSON-task evaluation, plus task 8/16 and a derived task-20 action-boundary timing probe scored from existing verified JSON.",
185
  "plotted_as": "colored point overlay",
186
  "result_record_count": 20,
187
+ "scored_task_count": 10,
188
+ "covered_task_count": 10,
189
  "proxy_scored_task_count": 0,
190
+ "scoreless_task_count": 10,
191
  "unsupported_task_count": 0,
192
+ "not_evaluated_task_count": 10,
193
  "status_counts": {
194
+ "not_evaluated_in_verified_package": 10,
195
+ "scored": 10
196
  },
197
+ "coverage_fraction": 0.5,
198
  "result_record_fraction": 1.0
199
  },
200
  {
 
205
  "kind": "partial_128_episode_world_model_overlay",
206
  "scope": "128 selected episodes, held-out test",
207
  "stroke_dasharray": "2 7",
208
+ "method_detail": "Verified Cosmos3-Nano future-window compatibility metrics, plus tasks 10/13/14/16/17 and a derived task-20 boundary timing probe scored from existing held-out future-window artifacts.",
209
  "plotted_as": "colored point overlay",
210
  "result_record_count": 20,
211
+ "scored_task_count": 11,
212
+ "covered_task_count": 11,
213
  "proxy_scored_task_count": 0,
214
+ "scoreless_task_count": 9,
215
  "unsupported_task_count": 0,
216
+ "not_evaluated_task_count": 9,
217
  "status_counts": {
218
+ "not_evaluated_in_verified_package": 9,
219
+ "scored": 11
220
  },
221
+ "coverage_fraction": 0.55,
222
  "result_record_fraction": 1.0
223
  }
224
  ],
 
1489
  "task_label": "Language Grounding",
1490
  "series_id": "cosmos3_super_reasoner",
1491
  "method": "Cosmos3-Super Reasoner",
1492
+ "status": "scored",
1493
+ "status_label": "scored",
1494
+ "scored": true,
1495
  "proxy_scored": false,
1496
+ "raw": 0.30639899644580487,
1497
+ "raw_text": "0.3064",
1498
+ "normalized_score": 0.30639899644580487,
1499
+ "metric_key": "caption_grounding_iou",
1500
+ "source": "results/omni_finetune/model_output_task_probes_20260616/caption_grounding/cosmos3_super_reasoner/metrics.json",
1501
  "scope": "multi_episode_128_partial_model_overlay",
1502
+ "reason": null
1503
  },
1504
  {
1505
  "task_number": 8,
 
2803
  "task_label": "Action-Object Relation Prediction",
2804
  "series_id": "cosmos3_nano_future_window",
2805
  "method": "Cosmos3-Nano Future Window",
2806
+ "status": "scored",
2807
+ "status_label": "scored",
2808
+ "scored": true,
2809
  "proxy_scored": false,
2810
+ "raw": 0.002794157670325683,
2811
+ "raw_text": "0.0028",
2812
+ "normalized_score": 0.002794157670325683,
2813
+ "metric_key": "action_object_relation_macro_f1",
2814
+ "source": "results/omni_finetune/model_output_task_probes_20260616/action_object_relation/cosmos3_nano_future_window/metrics.json",
2815
  "scope": "multi_episode_128_partial_model_overlay",
2816
+ "reason": null
2817
  },
2818
  {
2819
  "task_number": 17,
data/task_surface_integrity.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
  "status": "pass",
3
- "generated_at_utc": "2026-06-18T22:27:40+00:00",
4
  "summary": {
5
  "task_count": 12,
6
  "expected_task_count": 12,
 
1
  {
2
  "status": "pass",
3
+ "generated_at_utc": "2026-06-18T22:57:59+00:00",
4
  "summary": {
5
  "task_count": 12,
6
  "expected_task_count": 12,
data/website_integrity.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
  "status": "pass",
3
- "generated_at_utc": "2026-06-18T22:27:45+00:00",
4
  "docs_root": "docs",
5
  "site_base": "/ropedia-xperience-10m-task-suite/",
6
  "summary": {
@@ -301,7 +301,7 @@
301
  },
302
  {
303
  "path": "data/artifact_index.json",
304
- "bytes": 116643,
305
  "top_level_type": "dict"
306
  },
307
  {
@@ -316,7 +316,7 @@
316
  },
317
  {
318
  "path": "data/episode128_task_model_radar.json",
319
- "bytes": 185391,
320
  "top_level_type": "dict"
321
  },
322
  {
@@ -351,7 +351,7 @@
351
  },
352
  {
353
  "path": "data/mirror_parity.json",
354
- "bytes": 938745,
355
  "top_level_type": "dict"
356
  },
357
  {
@@ -486,12 +486,12 @@
486
  },
487
  {
488
  "path": "data/task_method_20_gap_audit.json",
489
- "bytes": 29788,
490
  "top_level_type": "dict"
491
  },
492
  {
493
  "path": "data/task_method_20_result_matrix.json",
494
- "bytes": 128842,
495
  "top_level_type": "dict"
496
  },
497
  {
@@ -526,7 +526,7 @@
526
  },
527
  {
528
  "path": "data/unified_task_model_radar.json",
529
- "bytes": 229244,
530
  "top_level_type": "dict"
531
  },
532
  {
@@ -571,7 +571,7 @@
571
  {
572
  "path": "assets/charts/episode128_task_model_radar.svg",
573
  "exists": true,
574
- "bytes": 48704,
575
  "format": "SVG",
576
  "has_viewbox": true
577
  },
@@ -641,7 +641,7 @@
641
  {
642
  "path": "assets/charts/unified_task_model_radar.svg",
643
  "exists": true,
644
- "bytes": 54717,
645
  "format": "SVG",
646
  "has_viewbox": true
647
  },
 
1
  {
2
  "status": "pass",
3
+ "generated_at_utc": "2026-06-18T22:58:01+00:00",
4
  "docs_root": "docs",
5
  "site_base": "/ropedia-xperience-10m-task-suite/",
6
  "summary": {
 
301
  },
302
  {
303
  "path": "data/artifact_index.json",
304
+ "bytes": 116644,
305
  "top_level_type": "dict"
306
  },
307
  {
 
316
  },
317
  {
318
  "path": "data/episode128_task_model_radar.json",
319
+ "bytes": 185314,
320
  "top_level_type": "dict"
321
  },
322
  {
 
351
  },
352
  {
353
  "path": "data/mirror_parity.json",
354
+ "bytes": 1015184,
355
  "top_level_type": "dict"
356
  },
357
  {
 
486
  },
487
  {
488
  "path": "data/task_method_20_gap_audit.json",
489
+ "bytes": 28259,
490
  "top_level_type": "dict"
491
  },
492
  {
493
  "path": "data/task_method_20_result_matrix.json",
494
+ "bytes": 128805,
495
  "top_level_type": "dict"
496
  },
497
  {
 
526
  },
527
  {
528
  "path": "data/unified_task_model_radar.json",
529
+ "bytes": 229168,
530
  "top_level_type": "dict"
531
  },
532
  {
 
571
  {
572
  "path": "assets/charts/episode128_task_model_radar.svg",
573
  "exists": true,
574
+ "bytes": 48923,
575
  "format": "SVG",
576
  "has_viewbox": true
577
  },
 
641
  {
642
  "path": "assets/charts/unified_task_model_radar.svg",
643
  "exists": true,
644
+ "bytes": 54936,
645
  "format": "SVG",
646
  "has_viewbox": true
647
  },
results/omni_finetune/model_output_probe_readiness/RUN_REPORT.md CHANGED
@@ -1,6 +1,6 @@
1
  # Model Output Probe Readiness
2
 
3
- Generated: `2026-06-18T18:10:07+00:00`
4
 
5
  This report checks whether verified model branches have the prediction files
6
  needed to extend them to every 20-task contract. It is readiness evidence only;
@@ -8,6 +8,6 @@ it does not assign new task scores.
8
 
9
  | Method | ID | Matrix scores | Status | Split files | Next step |
10
  | --- | --- | --- | --- | --- | --- |
11
- | Cosmos3-Nano Future Window | cosmos3_nano_future_window | 7/20 | missing_required_model_outputs | train: missing; validation: missing; test: missing | Collect or generate train, validation, and test prediction JSONL files first. |
12
- | Cosmos3-Super Reasoner | cosmos3_super_reasoner | 8/20 | missing_required_model_outputs | train: missing; validation: missing; test: present | Collect or generate train, validation, and test prediction JSONL files first. |
13
- | Qwen3-Omni v6 LoRA | qwen3_omni_v6_lora | 15/20 | missing_required_model_outputs | train: missing; validation: missing; test: present | Collect or generate train, validation, and test prediction JSONL files first. |
 
1
  # Model Output Probe Readiness
2
 
3
+ Generated: `2026-06-18T22:44:42+00:00`
4
 
5
  This report checks whether verified model branches have the prediction files
6
  needed to extend them to every 20-task contract. It is readiness evidence only;
 
8
 
9
  | Method | ID | Matrix scores | Status | Split files | Next step |
10
  | --- | --- | --- | --- | --- | --- |
11
+ | Cosmos3-Nano Future Window | cosmos3_nano_future_window | 10/20 | missing_required_model_outputs | train: missing; validation: missing; test: missing | Collect or generate train, validation, and test prediction JSONL files first. |
12
+ | Cosmos3-Super Reasoner | cosmos3_super_reasoner | 9/20 | missing_required_model_outputs | train: missing; validation: missing; test: present | Collect or generate train, validation, and test prediction JSONL files first. |
13
+ | Qwen3-Omni v6 LoRA | qwen3_omni_v6_lora | 16/20 | missing_required_model_outputs | train: missing; validation: missing; test: present | Collect or generate train, validation, and test prediction JSONL files first. |
results/omni_finetune/model_output_probe_readiness/model_output_probe_readiness.json CHANGED
@@ -1,10 +1,10 @@
1
  {
2
- "generated_at_utc": "2026-06-18T18:10:07+00:00",
3
  "methods": {
4
  "cosmos3_nano_future_window": {
5
  "label": "Cosmos3-Nano Future Window",
6
- "matrix_scored_task_count": 7,
7
- "matrix_scoreless_task_count": 13,
8
  "next_step": "Collect or generate train, validation, and test prediction JSONL files first.",
9
  "ready_for_all_task_probe": false,
10
  "required_splits": [
@@ -19,13 +19,10 @@
19
  "caption_grounding",
20
  "temporal_order",
21
  "misalignment_detection",
22
- "next_subtask_forecast",
23
  "interaction_text_prediction",
24
  "action_object_relation",
25
- "object_set_forecast",
26
  "imu_to_hand_pose",
27
- "camera_view_sync_retrieval",
28
- "time_to_transition"
29
  ],
30
  "split_status": {
31
  "test": {
@@ -54,8 +51,8 @@
54
  },
55
  "cosmos3_super_reasoner": {
56
  "label": "Cosmos3-Super Reasoner",
57
- "matrix_scored_task_count": 8,
58
- "matrix_scoreless_task_count": 12,
59
  "next_step": "Collect or generate train, validation, and test prediction JSONL files first.",
60
  "ready_for_all_task_probe": false,
61
  "required_splits": [
@@ -70,7 +67,6 @@
70
  "modality_reconstruction",
71
  "temporal_order",
72
  "misalignment_detection",
73
- "long_horizon_next_action",
74
  "next_subtask_forecast",
75
  "interaction_text_prediction",
76
  "object_set_forecast",
@@ -103,8 +99,8 @@
103
  },
104
  "qwen3_omni_v6_lora": {
105
  "label": "Qwen3-Omni v6 LoRA",
106
- "matrix_scored_task_count": 15,
107
- "matrix_scoreless_task_count": 5,
108
  "next_step": "Collect or generate train, validation, and test prediction JSONL files first.",
109
  "ready_for_all_task_probe": false,
110
  "required_splits": [
@@ -116,8 +112,7 @@
116
  "hand_trajectory_forecast",
117
  "modality_reconstruction",
118
  "interaction_text_prediction",
119
- "imu_to_hand_pose",
120
- "camera_view_sync_retrieval"
121
  ],
122
  "split_status": {
123
  "test": {
 
1
  {
2
+ "generated_at_utc": "2026-06-18T22:44:42+00:00",
3
  "methods": {
4
  "cosmos3_nano_future_window": {
5
  "label": "Cosmos3-Nano Future Window",
6
+ "matrix_scored_task_count": 10,
7
+ "matrix_scoreless_task_count": 10,
8
  "next_step": "Collect or generate train, validation, and test prediction JSONL files first.",
9
  "ready_for_all_task_probe": false,
10
  "required_splits": [
 
19
  "caption_grounding",
20
  "temporal_order",
21
  "misalignment_detection",
 
22
  "interaction_text_prediction",
23
  "action_object_relation",
 
24
  "imu_to_hand_pose",
25
+ "camera_view_sync_retrieval"
 
26
  ],
27
  "split_status": {
28
  "test": {
 
51
  },
52
  "cosmos3_super_reasoner": {
53
  "label": "Cosmos3-Super Reasoner",
54
+ "matrix_scored_task_count": 9,
55
+ "matrix_scoreless_task_count": 11,
56
  "next_step": "Collect or generate train, validation, and test prediction JSONL files first.",
57
  "ready_for_all_task_probe": false,
58
  "required_splits": [
 
67
  "modality_reconstruction",
68
  "temporal_order",
69
  "misalignment_detection",
 
70
  "next_subtask_forecast",
71
  "interaction_text_prediction",
72
  "object_set_forecast",
 
99
  },
100
  "qwen3_omni_v6_lora": {
101
  "label": "Qwen3-Omni v6 LoRA",
102
+ "matrix_scored_task_count": 16,
103
+ "matrix_scoreless_task_count": 4,
104
  "next_step": "Collect or generate train, validation, and test prediction JSONL files first.",
105
  "ready_for_all_task_probe": false,
106
  "required_splits": [
 
112
  "hand_trajectory_forecast",
113
  "modality_reconstruction",
114
  "interaction_text_prediction",
115
+ "imu_to_hand_pose"
 
116
  ],
117
  "split_status": {
118
  "test": {
results/omni_finetune/model_output_task_probes_20260616/action_object_relation/cosmos3_nano_future_window/metrics.json ADDED
@@ -0,0 +1,187 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "accuracy": 0.013297872340425532,
3
+ "action_object_relation_accuracy": 0.013297872340425532,
4
+ "action_object_relation_macro_f1": 0.002794157670325683,
5
+ "artifact_files": {
6
+ "metrics_json": "results/omni_finetune/model_output_task_probes_20260616/action_object_relation/cosmos3_nano_future_window/metrics.json",
7
+ "per_class_metrics_csv": "results/omni_finetune/model_output_task_probes_20260616/action_object_relation/cosmos3_nano_future_window/per_class_metrics.csv",
8
+ "predictions_csv": "results/omni_finetune/model_output_task_probes_20260616/action_object_relation/cosmos3_nano_future_window/predictions.csv"
9
+ },
10
+ "generated_at_utc": "2026-06-18T22:52:18+00:00",
11
+ "known_limitation": "This is a retrieval-derived future relation score, not a separately prompted action-object generation head.",
12
+ "labels": [
13
+ "Adjust canned food on shelf :: canned food | cardboard box | store shelf",
14
+ "Adjust item on shelf :: shelf | stationery package",
15
+ "Adjust lantern shape :: red pleated paper lantern",
16
+ "Adjust paper :: cardboard square | paper | pen | star beads",
17
+ "Adjust pot position :: pot",
18
+ "Adjust puzzle piece :: jigsaw puzzle | puzzle box | puzzle pieces",
19
+ "Align edges of paper lantern :: hands | red paper lantern",
20
+ "Align paper lantern edges :: hands | red paper lantern",
21
+ "Apply adhesive tape to lantern :: adhesive tape | red paper lantern",
22
+ "Approach boxes :: cardboard boxes | colleague | shelving unit",
23
+ "Approaching and pressing the door switch :: glass door | switch | wall",
24
+ "Approaching the table :: beads | chairs | table",
25
+ "Arrange buttons :: red buttons | smartphone | table",
26
+ "Arrange buttons in a line :: buttons | phone | table",
27
+ "Arrange star beads for counting :: paper | pen | star beads",
28
+ "Attempt to fit puzzle piece :: puzzle board | puzzle piece",
29
+ "Attempt to fit puzzle piece :: puzzle piece",
30
+ "Bend and manipulate plastic strip :: plastic strip | stationary box | table | water bottle",
31
+ "Browse smartphone screen :: paper strips | smartphone | star ornaments",
32
+ "Closing the door :: door | dustpan",
33
+ "Counting and organizing beads :: cardboard squares | paper | pen | star-shaped beads",
34
+ "Counting star beads :: paper | pen | star beads",
35
+ "Cut along the marked line :: cardboard | hand | utility knife",
36
+ "Cut cardboard piece :: cardboard strip | scissors",
37
+ "Entering the VR training room :: doorway | person | table",
38
+ "Expand paper lantern :: adhesive tape roll | cardboard box | red paper lantern",
39
+ "Extract wire hangers from box :: cardboard box | wire hangers",
40
+ "Fold paper lantern :: red paper honeycomb lantern",
41
+ "Gesturing :: cardboard pieces | marker | pencil case | ruler | scissors",
42
+ "Grasp cleaning bottle :: bowls | chopping board | cleaning fluid bottle",
43
+ "Grasp lantern :: red paper honeycomb lantern",
44
+ "Grasping cleaning cloth :: cleaning cloth | countertop",
45
+ "Greeting/acknowledging participants :: person | table | vr headset",
46
+ "Handle paper lantern component :: cardboard box | paper lantern component | plastic bag | red paper lantern",
47
+ "Hold and bend plastic strip :: bottle | purple plastic strip | stationery box",
48
+ "Hold and manipulate paper strip :: beads | mobile phone | power bank | yellow paper strip",
49
+ "Hold and manipulate paper strip :: beads | paper strip | power bank | smartphone",
50
+ "Hold beads :: paper | pen | power bank | smartphone | star-shaped beads",
51
+ "Hold container lid :: dustpan | red plastic container lid",
52
+ "Hold earbud case :: box of products | earbud case | shelf",
53
+ "Hold smartphone :: quilling paper strips | small blue beads | smartphone",
54
+ "Identify next cardboard piece :: cardboard pieces | marker",
55
+ "Inspect shelf condition :: colleague | shelf",
56
+ "Interact with smartphone :: beads | smartphone | yellow paper strip",
57
+ "Interact with smartphone :: cans | cereal box | shelf | smartphone",
58
+ "Interact with smartphone :: cans | shelf | smartphone",
59
+ "Lift pot lid :: pot | pot lid",
60
+ "Manipulate adhesive strip :: adhesive strip | paper sheets | puzzle box | smartphone | water bottle",
61
+ "Manipulate bead :: bead piles | container | paper strips | yellow bead",
62
+ "Manipulate bead :: bead | bead piles | pen holder | table",
63
+ "Manipulate bead :: bead | bead piles | table",
64
+ "Manipulate beads :: blue beads | power bank | smartphone | yellow beads",
65
+ "Manipulate craft paper strips :: paper strips | scissors | smartphone",
66
+ "Manipulate craft piece :: craft pieces | scissors | smartphone",
67
+ "Manipulate material :: blue crafting material | hand",
68
+ "Manipulate paper edge :: hands | paper cone | puzzle box | smartphone | water bottle",
69
+ "Manipulate paper strip :: container with tools | table | yellow paper strip",
70
+ "Manipulate paper strip :: craft materials | purple paper strip | scissors | smartphone",
71
+ "Manipulate paper strip :: paper cone | paper strip | puzzle box | smartphone | water bottle",
72
+ "Manipulate paper strip :: purple paper strip | quilling paper pile | smartphone",
73
+ "Manipulate plastic strip :: purple plastic strip | storage bin | water bottle",
74
+ "Manipulate plastic strips :: desk | plastic strips | water bottle",
75
+ "Manipulate puzzle pieces :: puzzle box | puzzle mat | puzzle pieces",
76
+ "Manipulate yellow strip :: beads | cell phone | pen | yellow strip",
77
+ "Manipulating paper strips :: beads | blue paper strip | yellow paper strip",
78
+ "Marking cardboard piece :: cardboard pieces | marker | ruler | scissors",
79
+ "Move dustpan to side :: dustpan",
80
+ "Move marker and adjust hand :: cardboard pieces | marker",
81
+ "Move phone :: cardboard | smartphone | utility knife",
82
+ "Move pot :: faucet | pot | sink",
83
+ "Move smartphone :: craft beads | paper strips | smartphone",
84
+ "Observe and pause :: cardboard pieces | marker | pencil case | ruler | scissors",
85
+ "Open earbud case :: earbud case",
86
+ "Open folded paper lantern :: cardboard box | red pleated paper lantern",
87
+ "Open paper lantern component :: paper lantern component",
88
+ "Open stove pot lid :: blue bowl | cloth | faucet | red bowl | sink | soap dispenser | white bowl",
89
+ "Operate smartphone :: craft paper strips | folded paper fan | paper scraps | scissors | smartphone | table",
90
+ "Operate smartphone :: craft paper strips | folded paper fan | smartphone",
91
+ "Operate smartphone :: paper scraps | scissors | smartphone | table",
92
+ "Organize cardboard pieces :: cardboard pieces | marker | pencil case | ruler | scissors",
93
+ "Pick up button :: buttons | table",
94
+ "Pick up items from the shopping bag :: cardboard boxes | red shopping bag | retail shelf",
95
+ "Pick up new cardboard piece :: cardboard piece | marker",
96
+ "Pick up packaged paper lantern component :: cardboard box | packaged paper lantern component",
97
+ "Pick up smartphone :: cans | shelf | smartphone",
98
+ "Pick up star bead :: cardboard squares | mobile phone | paper | pen | power bank | star beads",
99
+ "Pick up utility knife :: cardboard | utility knife",
100
+ "Picking up bottle :: bottle",
101
+ "Picking up crafting material :: beads | smartphone | table | yellow strip",
102
+ "Place and count bead :: paper | pen | star beads",
103
+ "Place another canned food on shelf :: box | canned food",
104
+ "Place button :: buttons | hand | smartphone | table",
105
+ "Place can on shelf :: canned food | retail shelf",
106
+ "Place canned food on shelf :: canned food | store shelf",
107
+ "Place cloth on floor :: cloth",
108
+ "Place item on shelf :: stationery package",
109
+ "Place items on the shelf :: packaged items | retail shelf",
110
+ "Place material :: bead design | blue crafting material | hand",
111
+ "Place phone down :: beads | pencil holder | smartphone | yellow paper strip",
112
+ "Place piece into puzzle :: jigsaw puzzle | puzzle piece",
113
+ "Place puzzle piece :: puzzle board | puzzle piece",
114
+ "Place smartphone down :: power bank | quilling paper strips | small paper stars | smartphone",
115
+ "Place smartphone down :: quilling paper strips | small paper stars | smartphone",
116
+ "Place smartphone on stand :: saucepan | smartphone | smartphone stand | yellow jacket",
117
+ "Place towel :: pot | towel",
118
+ "Placing paper strip :: adhesive strip | paper cone | phone",
119
+ "Put down smartphone :: paper quilling strips | power bank | smartphone | star beads",
120
+ "Put down smartphone :: paper quilling strips | smartphone | star beads",
121
+ "Put down smartphone :: power bank | smartphone",
122
+ "Reach for another item :: item | packaged item | shelf",
123
+ "Reach for cleaning supplies :: bowls | chopping board | cleaning fluid bottle",
124
+ "Reach for next canned food :: box | canned food",
125
+ "Reach for next canned food :: box | canned food | retail shelf",
126
+ "Reach for next item :: packaged item | shelf",
127
+ "Reach for puzzle piece :: puzzle board | puzzle box | puzzle pieces",
128
+ "Reach for wire hangers :: cardboard box | wire hangers",
129
+ "Reach into box :: box of cans",
130
+ "Release cardboard piece and gesture :: cardboard piece | cardboard piles | marker | pouch | ruler | scissors",
131
+ "Release hook :: display hook",
132
+ "Release lantern :: red paper lantern",
133
+ "Remove paper lantern part from packaging :: paper lantern component | plastic packaging",
134
+ "Remove paper lantern part from packaging :: paper lantern | red hand fan",
135
+ "Remove plastic packaging :: packaging | paper lantern component",
136
+ "Reposition hand :: cardboard | utility knife",
137
+ "Resume observation :: cardboard pieces | marker | pencil case | ruler | scissors",
138
+ "Retrieve canned food from box :: box | canned food",
139
+ "Retrieve next canned food item :: canned food | cardboard box",
140
+ "Retrieving more beads :: paper | pen | star beads",
141
+ "Rinse cloth in sink :: cloth | sink | water faucet",
142
+ "Scroll smartphone screen :: paper stars | paper strips | smartphone",
143
+ "Search for puzzle piece :: jigsaw puzzle | puzzle pieces",
144
+ "Secure paper edges with adhesive :: adhesive strip | paper cone pieces | puzzle box | smartphone | water bottle",
145
+ "Secure paper edges with adhesive :: adhesive strip | paper cone | paper cone pieces | puzzle box | smartphone | water bottle",
146
+ "Securing paper structure :: paper cone | paper strip | puzzle box | smartphone | water bottle",
147
+ "Sort and adjust button line :: buttons | smartphone | table",
148
+ "Sort and arrange buttons :: buttons | smartphones | soda can | table",
149
+ "Sort and arrange buttons :: buttons | smartphones | table",
150
+ "Sort and count beads :: cell phone | paper | pen | star beads",
151
+ "Sort and count beads :: paper | pen | star beads",
152
+ "Sort beads and write count :: paper | pen | power bank | smartphone | star-shaped beads",
153
+ "Sort button :: buttons | cell phone",
154
+ "Sort craft items :: star-shaped craft items | table",
155
+ "Sort puzzle pieces :: jigsaw puzzle pieces | table",
156
+ "Sort star-shaped beads :: marker | mobile phone | paper | power bank | star-shaped beads",
157
+ "Stir contents :: cooking utensil | pot",
158
+ "Use smartphone :: buttons | chair | smartphone | table",
159
+ "Use smartphone :: buttons | smartphone | table",
160
+ "Use smartphone :: charging cable | paper strips | power bank | smartphone | star-shaped paper crafts",
161
+ "Walk towards shelves :: cardboard boxes | red bin | shelving unit",
162
+ "Walking towards door :: door | dustpan",
163
+ "Write count on paper :: marker | mobile phone | paper | power bank | star-shaped beads"
164
+ ],
165
+ "macro_f1": 0.002794157670325683,
166
+ "metric_key": "action_object_relation_macro_f1",
167
+ "missing_pred_target_count": 0,
168
+ "missing_true_target_count": 0,
169
+ "model_id": "cosmos3_nano_future_window",
170
+ "model_label": "Cosmos3-Nano Future Window",
171
+ "normalization_policy": "Action text is whitespace-normalized. Objects are casefolded, deduplicated, sorted, and joined into a canonical relation label before macro-F1 scoring.",
172
+ "num_samples": 376,
173
+ "primary_metric": "action_object_relation_macro_f1",
174
+ "primary_score": 0.002794157670325683,
175
+ "scope": "held_out_test_existing_future_window_retrieval_probe",
176
+ "score_policy": "Derived from existing verified held-out Cosmos3-Nano future-window predictions. The true future record and retrieved future record are joined to the public-safe target map, then scored on the action plus object-set relation.",
177
+ "scored_rows": 376,
178
+ "source_prediction_jsonl": "results/omni_finetune/verified_public/xperience10m_cosmos3_nano_128ep_future_window_h5_compat_adapter_eval_test_full/eval/future_predictions.jsonl",
179
+ "source_target_map_jsonl": "results/omni_finetune/model_output_task_probes_20260616/cosmos3_nano_future_window_target_map.jsonl",
180
+ "status": "pass",
181
+ "target_map_rows": 448,
182
+ "task_id": "action_object_relation",
183
+ "task_label": "Action-Object Relation",
184
+ "task_number": 16,
185
+ "title": "Cosmos3-Nano Future Window Future Action-Object Relation Probe",
186
+ "total_prediction_rows": 378
187
+ }
results/omni_finetune/model_output_task_probes_20260616/action_object_relation/cosmos3_nano_future_window/per_class_metrics.csv ADDED
@@ -0,0 +1,152 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ class_name,support,predicted,precision,recall,f1
2
+ Adjust canned food on shelf :: canned food | cardboard box | store shelf,2,0,0.0,0.0,0.0
3
+ Adjust item on shelf :: shelf | stationery package,4,1,0.0,0.0,0.0
4
+ Adjust lantern shape :: red pleated paper lantern,2,0,0.0,0.0,0.0
5
+ Adjust paper :: cardboard square | paper | pen | star beads,3,0,0.0,0.0,0.0
6
+ Adjust pot position :: pot,3,0,0.0,0.0,0.0
7
+ Adjust puzzle piece :: jigsaw puzzle | puzzle box | puzzle pieces,3,0,0.0,0.0,0.0
8
+ Align edges of paper lantern :: hands | red paper lantern,2,0,0.0,0.0,0.0
9
+ Align paper lantern edges :: hands | red paper lantern,2,0,0.0,0.0,0.0
10
+ Apply adhesive tape to lantern :: adhesive tape | red paper lantern,3,0,0.0,0.0,0.0
11
+ Approach boxes :: cardboard boxes | colleague | shelving unit,3,0,0.0,0.0,0.0
12
+ Approaching and pressing the door switch :: glass door | switch | wall,6,0,0.0,0.0,0.0
13
+ Approaching the table :: beads | chairs | table,2,0,0.0,0.0,0.0
14
+ Arrange buttons :: red buttons | smartphone | table,2,0,0.0,0.0,0.0
15
+ Arrange buttons in a line :: buttons | phone | table,7,0,0.0,0.0,0.0
16
+ Arrange star beads for counting :: paper | pen | star beads,4,0,0.0,0.0,0.0
17
+ Attempt to fit puzzle piece :: puzzle board | puzzle piece,3,0,0.0,0.0,0.0
18
+ Attempt to fit puzzle piece :: puzzle piece,2,0,0.0,0.0,0.0
19
+ Bend and manipulate plastic strip :: plastic strip | stationary box | table | water bottle,1,0,0.0,0.0,0.0
20
+ Browse smartphone screen :: paper strips | smartphone | star ornaments,3,0,0.0,0.0,0.0
21
+ Closing the door :: door | dustpan,2,0,0.0,0.0,0.0
22
+ Counting and organizing beads :: cardboard squares | paper | pen | star-shaped beads,2,0,0.0,0.0,0.0
23
+ Counting star beads :: paper | pen | star beads,2,0,0.0,0.0,0.0
24
+ Cut along the marked line :: cardboard | hand | utility knife,7,0,0.0,0.0,0.0
25
+ Cut cardboard piece :: cardboard strip | scissors,3,0,0.0,0.0,0.0
26
+ Entering the VR training room :: doorway | person | table,3,0,0.0,0.0,0.0
27
+ Expand paper lantern :: adhesive tape roll | cardboard box | red paper lantern,3,0,0.0,0.0,0.0
28
+ Extract wire hangers from box :: cardboard box | wire hangers,1,0,0.0,0.0,0.0
29
+ Fold paper lantern :: red paper honeycomb lantern,2,0,0.0,0.0,0.0
30
+ Gesturing :: cardboard pieces | marker | pencil case | ruler | scissors,2,0,0.0,0.0,0.0
31
+ Grasp cleaning bottle :: bowls | chopping board | cleaning fluid bottle,1,0,0.0,0.0,0.0
32
+ Grasp lantern :: red paper honeycomb lantern,1,0,0.0,0.0,0.0
33
+ Grasping cleaning cloth :: cleaning cloth | countertop,4,361,0.0110803324099723,1.0,0.021917808219178086
34
+ Greeting/acknowledging participants :: person | table | vr headset,2,0,0.0,0.0,0.0
35
+ Handle paper lantern component :: cardboard box | paper lantern component | plastic bag | red paper lantern,1,0,0.0,0.0,0.0
36
+ Hold and bend plastic strip :: bottle | purple plastic strip | stationery box,2,0,0.0,0.0,0.0
37
+ Hold and manipulate paper strip :: beads | mobile phone | power bank | yellow paper strip,3,0,0.0,0.0,0.0
38
+ Hold and manipulate paper strip :: beads | paper strip | power bank | smartphone,1,0,0.0,0.0,0.0
39
+ Hold beads :: paper | pen | power bank | smartphone | star-shaped beads,2,0,0.0,0.0,0.0
40
+ Hold container lid :: dustpan | red plastic container lid,1,0,0.0,0.0,0.0
41
+ Hold earbud case :: box of products | earbud case | shelf,1,0,0.0,0.0,0.0
42
+ Hold smartphone :: quilling paper strips | small blue beads | smartphone,1,0,0.0,0.0,0.0
43
+ Identify next cardboard piece :: cardboard pieces | marker,3,0,0.0,0.0,0.0
44
+ Inspect shelf condition :: colleague | shelf,1,0,0.0,0.0,0.0
45
+ Interact with smartphone :: beads | smartphone | yellow paper strip,2,0,0.0,0.0,0.0
46
+ Interact with smartphone :: cans | cereal box | shelf | smartphone,1,0,0.0,0.0,0.0
47
+ Interact with smartphone :: cans | shelf | smartphone,4,0,0.0,0.0,0.0
48
+ Lift pot lid :: pot | pot lid,1,0,0.0,0.0,0.0
49
+ Manipulate adhesive strip :: adhesive strip | paper sheets | puzzle box | smartphone | water bottle,5,0,0.0,0.0,0.0
50
+ Manipulate bead :: bead piles | container | paper strips | yellow bead,2,0,0.0,0.0,0.0
51
+ Manipulate bead :: bead | bead piles | pen holder | table,1,0,0.0,0.0,0.0
52
+ Manipulate bead :: bead | bead piles | table,1,0,0.0,0.0,0.0
53
+ Manipulate beads :: blue beads | power bank | smartphone | yellow beads,2,0,0.0,0.0,0.0
54
+ Manipulate craft paper strips :: paper strips | scissors | smartphone,8,0,0.0,0.0,0.0
55
+ Manipulate craft piece :: craft pieces | scissors | smartphone,2,0,0.0,0.0,0.0
56
+ Manipulate material :: blue crafting material | hand,2,0,0.0,0.0,0.0
57
+ Manipulate paper edge :: hands | paper cone | puzzle box | smartphone | water bottle,8,0,0.0,0.0,0.0
58
+ Manipulate paper strip :: container with tools | table | yellow paper strip,2,0,0.0,0.0,0.0
59
+ Manipulate paper strip :: craft materials | purple paper strip | scissors | smartphone,7,0,0.0,0.0,0.0
60
+ Manipulate paper strip :: paper cone | paper strip | puzzle box | smartphone | water bottle,2,0,0.0,0.0,0.0
61
+ Manipulate paper strip :: purple paper strip | quilling paper pile | smartphone,3,0,0.0,0.0,0.0
62
+ Manipulate plastic strip :: purple plastic strip | storage bin | water bottle,6,0,0.0,0.0,0.0
63
+ Manipulate plastic strips :: desk | plastic strips | water bottle,7,0,0.0,0.0,0.0
64
+ Manipulate puzzle pieces :: puzzle box | puzzle mat | puzzle pieces,6,0,0.0,0.0,0.0
65
+ Manipulate yellow strip :: beads | cell phone | pen | yellow strip,2,0,0.0,0.0,0.0
66
+ Manipulating paper strips :: beads | blue paper strip | yellow paper strip,1,0,0.0,0.0,0.0
67
+ Marking cardboard piece :: cardboard pieces | marker | ruler | scissors,3,0,0.0,0.0,0.0
68
+ Move dustpan to side :: dustpan,1,2,0.0,0.0,0.0
69
+ Move marker and adjust hand :: cardboard pieces | marker,3,0,0.0,0.0,0.0
70
+ Move phone :: cardboard | smartphone | utility knife,13,0,0.0,0.0,0.0
71
+ Move pot :: faucet | pot | sink,1,0,0.0,0.0,0.0
72
+ Move smartphone :: craft beads | paper strips | smartphone,3,2,0.5,0.3333333333333333,0.4
73
+ Observe and pause :: cardboard pieces | marker | pencil case | ruler | scissors,2,0,0.0,0.0,0.0
74
+ Open earbud case :: earbud case,3,0,0.0,0.0,0.0
75
+ Open folded paper lantern :: cardboard box | red pleated paper lantern,4,0,0.0,0.0,0.0
76
+ Open paper lantern component :: paper lantern component,1,0,0.0,0.0,0.0
77
+ Open stove pot lid :: blue bowl | cloth | faucet | red bowl | sink | soap dispenser | white bowl,2,0,0.0,0.0,0.0
78
+ Operate smartphone :: craft paper strips | folded paper fan | paper scraps | scissors | smartphone | table,1,0,0.0,0.0,0.0
79
+ Operate smartphone :: craft paper strips | folded paper fan | smartphone,7,1,0.0,0.0,0.0
80
+ Operate smartphone :: paper scraps | scissors | smartphone | table,2,0,0.0,0.0,0.0
81
+ Organize cardboard pieces :: cardboard pieces | marker | pencil case | ruler | scissors,5,0,0.0,0.0,0.0
82
+ Pick up button :: buttons | table,3,0,0.0,0.0,0.0
83
+ Pick up items from the shopping bag :: cardboard boxes | red shopping bag | retail shelf,3,3,0.0,0.0,0.0
84
+ Pick up new cardboard piece :: cardboard piece | marker,2,0,0.0,0.0,0.0
85
+ Pick up packaged paper lantern component :: cardboard box | packaged paper lantern component,1,0,0.0,0.0,0.0
86
+ Pick up smartphone :: cans | shelf | smartphone,2,0,0.0,0.0,0.0
87
+ Pick up star bead :: cardboard squares | mobile phone | paper | pen | power bank | star beads,1,0,0.0,0.0,0.0
88
+ Pick up utility knife :: cardboard | utility knife,4,0,0.0,0.0,0.0
89
+ Picking up bottle :: bottle,1,0,0.0,0.0,0.0
90
+ Picking up crafting material :: beads | smartphone | table | yellow strip,3,0,0.0,0.0,0.0
91
+ Place and count bead :: paper | pen | star beads,4,0,0.0,0.0,0.0
92
+ Place another canned food on shelf :: box | canned food,2,0,0.0,0.0,0.0
93
+ Place button :: buttons | hand | smartphone | table,3,0,0.0,0.0,0.0
94
+ Place can on shelf :: canned food | retail shelf,3,0,0.0,0.0,0.0
95
+ Place canned food on shelf :: canned food | store shelf,1,0,0.0,0.0,0.0
96
+ Place cloth on floor :: cloth,1,0,0.0,0.0,0.0
97
+ Place item on shelf :: stationery package,2,0,0.0,0.0,0.0
98
+ Place items on the shelf :: packaged items | retail shelf,4,0,0.0,0.0,0.0
99
+ Place material :: bead design | blue crafting material | hand,1,0,0.0,0.0,0.0
100
+ Place phone down :: beads | pencil holder | smartphone | yellow paper strip,2,0,0.0,0.0,0.0
101
+ Place piece into puzzle :: jigsaw puzzle | puzzle piece,4,0,0.0,0.0,0.0
102
+ Place puzzle piece :: puzzle board | puzzle piece,3,0,0.0,0.0,0.0
103
+ Place smartphone down :: power bank | quilling paper strips | small paper stars | smartphone,1,0,0.0,0.0,0.0
104
+ Place smartphone down :: quilling paper strips | small paper stars | smartphone,2,0,0.0,0.0,0.0
105
+ Place smartphone on stand :: saucepan | smartphone | smartphone stand | yellow jacket,1,0,0.0,0.0,0.0
106
+ Place towel :: pot | towel,1,0,0.0,0.0,0.0
107
+ Placing paper strip :: adhesive strip | paper cone | phone,4,2,0.0,0.0,0.0
108
+ Put down smartphone :: paper quilling strips | power bank | smartphone | star beads,1,0,0.0,0.0,0.0
109
+ Put down smartphone :: paper quilling strips | smartphone | star beads,1,2,0.0,0.0,0.0
110
+ Put down smartphone :: power bank | smartphone,1,0,0.0,0.0,0.0
111
+ Reach for another item :: item | packaged item | shelf,1,0,0.0,0.0,0.0
112
+ Reach for cleaning supplies :: bowls | chopping board | cleaning fluid bottle,3,0,0.0,0.0,0.0
113
+ Reach for next canned food :: box | canned food,1,0,0.0,0.0,0.0
114
+ Reach for next canned food :: box | canned food | retail shelf,1,0,0.0,0.0,0.0
115
+ Reach for next item :: packaged item | shelf,1,0,0.0,0.0,0.0
116
+ Reach for puzzle piece :: puzzle board | puzzle box | puzzle pieces,2,0,0.0,0.0,0.0
117
+ Reach for wire hangers :: cardboard box | wire hangers,2,0,0.0,0.0,0.0
118
+ Reach into box :: box of cans,1,0,0.0,0.0,0.0
119
+ Release cardboard piece and gesture :: cardboard piece | cardboard piles | marker | pouch | ruler | scissors,2,0,0.0,0.0,0.0
120
+ Release hook :: display hook,1,0,0.0,0.0,0.0
121
+ Release lantern :: red paper lantern,2,0,0.0,0.0,0.0
122
+ Remove paper lantern part from packaging :: paper lantern component | plastic packaging,1,0,0.0,0.0,0.0
123
+ Remove paper lantern part from packaging :: paper lantern | red hand fan,1,0,0.0,0.0,0.0
124
+ Remove plastic packaging :: packaging | paper lantern component,1,0,0.0,0.0,0.0
125
+ Reposition hand :: cardboard | utility knife,3,0,0.0,0.0,0.0
126
+ Resume observation :: cardboard pieces | marker | pencil case | ruler | scissors,2,0,0.0,0.0,0.0
127
+ Retrieve canned food from box :: box | canned food,1,0,0.0,0.0,0.0
128
+ Retrieve next canned food item :: canned food | cardboard box,2,0,0.0,0.0,0.0
129
+ Retrieving more beads :: paper | pen | star beads,2,0,0.0,0.0,0.0
130
+ Rinse cloth in sink :: cloth | sink | water faucet,2,0,0.0,0.0,0.0
131
+ Scroll smartphone screen :: paper stars | paper strips | smartphone,2,0,0.0,0.0,0.0
132
+ Search for puzzle piece :: jigsaw puzzle | puzzle pieces,2,0,0.0,0.0,0.0
133
+ Secure paper edges with adhesive :: adhesive strip | paper cone pieces | puzzle box | smartphone | water bottle,3,0,0.0,0.0,0.0
134
+ Secure paper edges with adhesive :: adhesive strip | paper cone | paper cone pieces | puzzle box | smartphone | water bottle,1,0,0.0,0.0,0.0
135
+ Securing paper structure :: paper cone | paper strip | puzzle box | smartphone | water bottle,4,0,0.0,0.0,0.0
136
+ Sort and adjust button line :: buttons | smartphone | table,3,0,0.0,0.0,0.0
137
+ Sort and arrange buttons :: buttons | smartphones | soda can | table,1,0,0.0,0.0,0.0
138
+ Sort and arrange buttons :: buttons | smartphones | table,2,0,0.0,0.0,0.0
139
+ Sort and count beads :: cell phone | paper | pen | star beads,1,0,0.0,0.0,0.0
140
+ Sort and count beads :: paper | pen | star beads,2,0,0.0,0.0,0.0
141
+ Sort beads and write count :: paper | pen | power bank | smartphone | star-shaped beads,2,0,0.0,0.0,0.0
142
+ Sort button :: buttons | cell phone,3,0,0.0,0.0,0.0
143
+ Sort craft items :: star-shaped craft items | table,4,2,0.0,0.0,0.0
144
+ Sort puzzle pieces :: jigsaw puzzle pieces | table,2,0,0.0,0.0,0.0
145
+ Sort star-shaped beads :: marker | mobile phone | paper | power bank | star-shaped beads,1,0,0.0,0.0,0.0
146
+ Stir contents :: cooking utensil | pot,1,0,0.0,0.0,0.0
147
+ Use smartphone :: buttons | chair | smartphone | table,1,0,0.0,0.0,0.0
148
+ Use smartphone :: buttons | smartphone | table,2,0,0.0,0.0,0.0
149
+ Use smartphone :: charging cable | paper strips | power bank | smartphone | star-shaped paper crafts,5,0,0.0,0.0,0.0
150
+ Walk towards shelves :: cardboard boxes | red bin | shelving unit,4,0,0.0,0.0,0.0
151
+ Walking towards door :: door | dustpan,1,0,0.0,0.0,0.0
152
+ Write count on paper :: marker | mobile phone | paper | power bank | star-shaped beads,1,0,0.0,0.0,0.0
results/omni_finetune/model_output_task_probes_20260616/action_object_relation/cosmos3_nano_future_window/predictions.csv ADDED
The diff for this file is too large to render. See raw diff
 
results/omni_finetune/model_output_task_probes_20260616/action_object_relation/cosmos3_super_reasoner/metrics.json CHANGED
@@ -8,7 +8,7 @@
8
  "predictions_csv": "results/omni_finetune/model_output_task_probes_20260616/action_object_relation/cosmos3_super_reasoner/predictions.csv"
9
  },
10
  "excluded_rows_without_true_relation": 2,
11
- "generated_at_utc": "2026-06-18T20:58:29+00:00",
12
  "labels": [
13
  "Adjust canned food on shelf :: canned food | cardboard box | store shelf",
14
  "Adjust item on shelf :: shelf | stationery package",
 
8
  "predictions_csv": "results/omni_finetune/model_output_task_probes_20260616/action_object_relation/cosmos3_super_reasoner/predictions.csv"
9
  },
10
  "excluded_rows_without_true_relation": 2,
11
+ "generated_at_utc": "2026-06-18T22:52:18+00:00",
12
  "labels": [
13
  "Adjust canned food on shelf :: canned food | cardboard box | store shelf",
14
  "Adjust item on shelf :: shelf | stationery package",
results/omni_finetune/model_output_task_probes_20260616/action_object_relation/qwen3_omni_v6_lora/metrics.json CHANGED
@@ -8,7 +8,7 @@
8
  "predictions_csv": "results/omni_finetune/model_output_task_probes_20260616/action_object_relation/qwen3_omni_v6_lora/predictions.csv"
9
  },
10
  "excluded_rows_without_true_relation": 18,
11
- "generated_at_utc": "2026-06-18T20:58:29+00:00",
12
  "labels": [
13
  "Adjust canned food on shelf :: canned food | cardboard box | store shelf",
14
  "Adjust item on shelf :: hand | packaged item | shelf",
 
8
  "predictions_csv": "results/omni_finetune/model_output_task_probes_20260616/action_object_relation/qwen3_omni_v6_lora/predictions.csv"
9
  },
10
  "excluded_rows_without_true_relation": 18,
11
+ "generated_at_utc": "2026-06-18T22:52:17+00:00",
12
  "labels": [
13
  "Adjust canned food on shelf :: canned food | cardboard box | store shelf",
14
  "Adjust item on shelf :: hand | packaged item | shelf",
results/omni_finetune/model_output_task_probes_20260616/caption_grounding/cosmos3_super_reasoner/metrics.json ADDED
@@ -0,0 +1,28 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "artifact_files": {
3
+ "metrics_json": "results/omni_finetune/model_output_task_probes_20260616/caption_grounding/cosmos3_super_reasoner/metrics.json",
4
+ "predictions_csv": "results/omni_finetune/model_output_task_probes_20260616/caption_grounding/cosmos3_super_reasoner/predictions.csv"
5
+ },
6
+ "caption_grounding_center_hit_rate": 0.3236607142857143,
7
+ "caption_grounding_iou": 0.30639899644580487,
8
+ "caption_grounding_within_20_frames": 0.35267857142857145,
9
+ "generated_at_utc": "2026-06-18T22:52:18+00:00",
10
+ "known_limitation": "This is an evidence-window localization score, not a candidate-set retrieval MRR.",
11
+ "metric_key": "caption_grounding_iou",
12
+ "missing_pred_evidence_window_count": 219,
13
+ "model_id": "cosmos3_super_reasoner",
14
+ "model_label": "Cosmos3-Super Reasoner",
15
+ "normalization_policy": "Evidence windows are frame intervals. The primary score is mean interval IoU; center-hit and within-20-frame rates are reported as diagnostics.",
16
+ "primary_metric": "caption_grounding_iou",
17
+ "primary_score": 0.30639899644580487,
18
+ "scope": "held_out_test_existing_verified_prediction_json",
19
+ "score_policy": "Derived from existing verified held-out structured JSON predictions. The task target is the evidence_window field already present in the true JSON; missing or invalid predicted evidence windows receive zero IoU.",
20
+ "scored_rows": 448,
21
+ "source_prediction_jsonl": "results/omni_finetune/verified_public/xperience10m_cosmos3_super_reasoner_128ep_test_full_20260607/eval/predictions.jsonl",
22
+ "status": "pass",
23
+ "task_id": "caption_grounding",
24
+ "task_label": "Language Grounding",
25
+ "task_number": 8,
26
+ "title": "Cosmos3-Super Reasoner Evidence-Window Grounding Probe",
27
+ "total_prediction_rows": 448
28
+ }
results/omni_finetune/model_output_task_probes_20260616/caption_grounding/cosmos3_super_reasoner/predictions.csv ADDED
@@ -0,0 +1,449 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ id,split,episode_id,true_start_frame,true_end_frame,pred_start_frame,pred_end_frame,pred_center_frame,center_error_frames,iou
2
+ 8a8e1b3c-607e-4ada-b3fd-fa639727e92c__ep1:qa:0,test,8a8e1b3c-607e-4ada-b3fd-fa639727e92c__ep1,0.0,19.0,0.0,19.0,9.5,0.0,1.0
3
+ 8a8e1b3c-607e-4ada-b3fd-fa639727e92c__ep1:qa:20,test,8a8e1b3c-607e-4ada-b3fd-fa639727e92c__ep1,400.0,419.0,400.0,419.0,409.5,0.0,1.0
4
+ 8a8e1b3c-607e-4ada-b3fd-fa639727e92c__ep1:qa:46,test,8a8e1b3c-607e-4ada-b3fd-fa639727e92c__ep1,920.0,939.0,914.0,939.0,926.5,3.0,0.7692307692307693
5
+ 8a8e1b3c-607e-4ada-b3fd-fa639727e92c__ep1:qa:50,test,8a8e1b3c-607e-4ada-b3fd-fa639727e92c__ep1,1000.0,1019.0,0.0,19.0,9.5,1000.0,0.0
6
+ 8a8e1b3c-607e-4ada-b3fd-fa639727e92c__ep1:qa:62,test,8a8e1b3c-607e-4ada-b3fd-fa639727e92c__ep1,1240.0,1259.0,1240.0,1259.0,1249.5,0.0,1.0
7
+ 8a8e1b3c-607e-4ada-b3fd-fa639727e92c__ep1:qa:70,test,8a8e1b3c-607e-4ada-b3fd-fa639727e92c__ep1,1400.0,1419.0,1410.0,1419.0,1414.5,5.0,0.5
8
+ 8a8e1b3c-607e-4ada-b3fd-fa639727e92c__ep1:qa:71,test,8a8e1b3c-607e-4ada-b3fd-fa639727e92c__ep1,1420.0,1439.0,1420.0,1439.0,1429.5,0.0,1.0
9
+ 8a8e1b3c-607e-4ada-b3fd-fa639727e92c__ep1:qa:90,test,8a8e1b3c-607e-4ada-b3fd-fa639727e92c__ep1,1800.0,1819.0,,,,,0.0
10
+ 8a8e1b3c-607e-4ada-b3fd-fa639727e92c__ep1:qa:100,test,8a8e1b3c-607e-4ada-b3fd-fa639727e92c__ep1,2000.0,2019.0,,,,,0.0
11
+ 8a8e1b3c-607e-4ada-b3fd-fa639727e92c__ep1:qa:120,test,8a8e1b3c-607e-4ada-b3fd-fa639727e92c__ep1,2400.0,2419.0,,,,,0.0
12
+ 8a8e1b3c-607e-4ada-b3fd-fa639727e92c__ep1:qa:126,test,8a8e1b3c-607e-4ada-b3fd-fa639727e92c__ep1,2520.0,2539.0,,,,,0.0
13
+ 8a8e1b3c-607e-4ada-b3fd-fa639727e92c__ep1:qa:127,test,8a8e1b3c-607e-4ada-b3fd-fa639727e92c__ep1,2540.0,2559.0,0.0,1.0,0.5,2549.0,0.0
14
+ 8a8e1b3c-607e-4ada-b3fd-fa639727e92c__ep1:qa:134,test,8a8e1b3c-607e-4ada-b3fd-fa639727e92c__ep1,2680.0,2699.0,2680.0,2699.0,2689.5,0.0,1.0
15
+ 8a8e1b3c-607e-4ada-b3fd-fa639727e92c__ep1:qa:140,test,8a8e1b3c-607e-4ada-b3fd-fa639727e92c__ep1,2800.0,2819.0,,,,,0.0
16
+ 8a8e1b3c-607e-4ada-b3fd-fa639727e92c__ep1:qa:150,test,8a8e1b3c-607e-4ada-b3fd-fa639727e92c__ep1,3000.0,3019.0,0.0,1.0,0.5,3009.0,0.0
17
+ 8a8e1b3c-607e-4ada-b3fd-fa639727e92c__ep1:qa:156,test,8a8e1b3c-607e-4ada-b3fd-fa639727e92c__ep1,3120.0,3139.0,3120.0,3139.0,3129.5,0.0,1.0
18
+ 8a8e1b3c-607e-4ada-b3fd-fa639727e92c__ep1:qa:166,test,8a8e1b3c-607e-4ada-b3fd-fa639727e92c__ep1,3320.0,3339.0,,,,,0.0
19
+ 8a8e1b3c-607e-4ada-b3fd-fa639727e92c__ep1:qa:170,test,8a8e1b3c-607e-4ada-b3fd-fa639727e92c__ep1,3400.0,3419.0,3264.0,3419.0,3341.5,68.0,0.1282051282051282
20
+ 8a8e1b3c-607e-4ada-b3fd-fa639727e92c__ep1:qa:184,test,8a8e1b3c-607e-4ada-b3fd-fa639727e92c__ep1,3680.0,3699.0,3680.0,3699.0,3689.5,0.0,1.0
21
+ 8a8e1b3c-607e-4ada-b3fd-fa639727e92c__ep1:qa:185,test,8a8e1b3c-607e-4ada-b3fd-fa639727e92c__ep1,3700.0,3719.0,3681.0,3719.0,3700.0,9.5,0.5128205128205128
22
+ 8a8e1b3c-607e-4ada-b3fd-fa639727e92c__ep1:qa:192,test,8a8e1b3c-607e-4ada-b3fd-fa639727e92c__ep1,3840.0,3859.0,3840.0,3859.0,3849.5,0.0,1.0
23
+ 8a8e1b3c-607e-4ada-b3fd-fa639727e92c__ep1:qa:200,test,8a8e1b3c-607e-4ada-b3fd-fa639727e92c__ep1,4000.0,4019.0,4000.0,4019.0,4009.5,0.0,1.0
24
+ 8a8e1b3c-607e-4ada-b3fd-fa639727e92c__ep1:qa:204,test,8a8e1b3c-607e-4ada-b3fd-fa639727e92c__ep1,4080.0,4099.0,4080.0,4099.0,4089.5,0.0,1.0
25
+ 8a8e1b3c-607e-4ada-b3fd-fa639727e92c__ep1:qa:205,test,8a8e1b3c-607e-4ada-b3fd-fa639727e92c__ep1,4100.0,4119.0,,,,,0.0
26
+ 8a8e1b3c-607e-4ada-b3fd-fa639727e92c__ep1:qa:212,test,8a8e1b3c-607e-4ada-b3fd-fa639727e92c__ep1,4240.0,4259.0,4240.0,4259.0,4249.5,0.0,1.0
27
+ 8a8e1b3c-607e-4ada-b3fd-fa639727e92c__ep1:qa:220,test,8a8e1b3c-607e-4ada-b3fd-fa639727e92c__ep1,4400.0,4419.0,,,,,0.0
28
+ 8a8e1b3c-607e-4ada-b3fd-fa639727e92c__ep1:qa:224,test,8a8e1b3c-607e-4ada-b3fd-fa639727e92c__ep1,4480.0,4499.0,0.0,1.0,0.5,4489.0,0.0
29
+ 8a8e1b3c-607e-4ada-b3fd-fa639727e92c__ep1:qa:232,test,8a8e1b3c-607e-4ada-b3fd-fa639727e92c__ep1,4640.0,4659.0,4640.0,4659.0,4649.5,0.0,1.0
30
+ 8a8e1b3c-607e-4ada-b3fd-fa639727e92c__ep1:qa:236,test,8a8e1b3c-607e-4ada-b3fd-fa639727e92c__ep1,4720.0,4739.0,4720.0,4739.0,4729.5,0.0,1.0
31
+ 8a8e1b3c-607e-4ada-b3fd-fa639727e92c__ep1:qa:237,test,8a8e1b3c-607e-4ada-b3fd-fa639727e92c__ep1,4740.0,4759.0,4740.0,4759.0,4749.5,0.0,1.0
32
+ 8a8e1b3c-607e-4ada-b3fd-fa639727e92c__ep1:qa:240,test,8a8e1b3c-607e-4ada-b3fd-fa639727e92c__ep1,4800.0,4819.0,4790.0,4819.0,4804.5,5.0,0.6666666666666666
33
+ 8a8e1b3c-607e-4ada-b3fd-fa639727e92c__ep1:qa:244,test,8a8e1b3c-607e-4ada-b3fd-fa639727e92c__ep1,4880.0,4899.0,4880.0,4899.0,4889.5,0.0,1.0
34
+ a1012a57-385e-45a9-8a59-694a26fe92a5__ep1:qa:0,test,a1012a57-385e-45a9-8a59-694a26fe92a5__ep1,0.0,19.0,0.0,19.0,9.5,0.0,1.0
35
+ a1012a57-385e-45a9-8a59-694a26fe92a5__ep1:qa:1,test,a1012a57-385e-45a9-8a59-694a26fe92a5__ep1,20.0,39.0,0.0,1.0,0.5,29.0,0.0
36
+ a1012a57-385e-45a9-8a59-694a26fe92a5__ep1:qa:2,test,a1012a57-385e-45a9-8a59-694a26fe92a5__ep1,40.0,59.0,0.0,59.0,29.5,20.0,0.3333333333333333
37
+ a1012a57-385e-45a9-8a59-694a26fe92a5__ep1:qa:3,test,a1012a57-385e-45a9-8a59-694a26fe92a5__ep1,60.0,79.0,0.0,1.0,0.5,69.0,0.0
38
+ a1012a57-385e-45a9-8a59-694a26fe92a5__ep1:qa:4,test,a1012a57-385e-45a9-8a59-694a26fe92a5__ep1,80.0,99.0,0.0,99.0,49.5,40.0,0.2
39
+ a1012a57-385e-45a9-8a59-694a26fe92a5__ep1:qa:5,test,a1012a57-385e-45a9-8a59-694a26fe92a5__ep1,100.0,119.0,0.0,119.0,59.5,50.0,0.16666666666666666
40
+ a1012a57-385e-45a9-8a59-694a26fe92a5__ep1:qa:6,test,a1012a57-385e-45a9-8a59-694a26fe92a5__ep1,120.0,139.0,0.0,139.0,69.5,60.0,0.14285714285714285
41
+ a1012a57-385e-45a9-8a59-694a26fe92a5__ep1:qa:12,test,a1012a57-385e-45a9-8a59-694a26fe92a5__ep1,240.0,259.0,,,,,0.0
42
+ a1012a57-385e-45a9-8a59-694a26fe92a5__ep1:qa:13,test,a1012a57-385e-45a9-8a59-694a26fe92a5__ep1,260.0,279.0,,,,,0.0
43
+ a1012a57-385e-45a9-8a59-694a26fe92a5__ep1:qa:14,test,a1012a57-385e-45a9-8a59-694a26fe92a5__ep1,280.0,299.0,,,,,0.0
44
+ a1012a57-385e-45a9-8a59-694a26fe92a5__ep1:qa:15,test,a1012a57-385e-45a9-8a59-694a26fe92a5__ep1,300.0,319.0,290.0,319.0,304.5,5.0,0.6666666666666666
45
+ a1012a57-385e-45a9-8a59-694a26fe92a5__ep1:qa:16,test,a1012a57-385e-45a9-8a59-694a26fe92a5__ep1,320.0,339.0,310.0,339.0,324.5,5.0,0.6666666666666666
46
+ a1012a57-385e-45a9-8a59-694a26fe92a5__ep1:qa:17,test,a1012a57-385e-45a9-8a59-694a26fe92a5__ep1,340.0,359.0,,,,,0.0
47
+ a1012a57-385e-45a9-8a59-694a26fe92a5__ep1:qa:18,test,a1012a57-385e-45a9-8a59-694a26fe92a5__ep1,360.0,379.0,360.0,379.0,369.5,0.0,1.0
48
+ a1012a57-385e-45a9-8a59-694a26fe92a5__ep1:qa:19,test,a1012a57-385e-45a9-8a59-694a26fe92a5__ep1,380.0,399.0,380.0,399.0,389.5,0.0,1.0
49
+ a1012a57-385e-45a9-8a59-694a26fe92a5__ep1:qa:20,test,a1012a57-385e-45a9-8a59-694a26fe92a5__ep1,400.0,419.0,393.0,419.0,406.0,3.5,0.7407407407407407
50
+ a1012a57-385e-45a9-8a59-694a26fe92a5__ep1:qa:21,test,a1012a57-385e-45a9-8a59-694a26fe92a5__ep1,420.0,439.0,419.0,439.0,429.0,0.5,0.9523809523809523
51
+ a1012a57-385e-45a9-8a59-694a26fe92a5__ep1:qa:22,test,a1012a57-385e-45a9-8a59-694a26fe92a5__ep1,440.0,459.0,430.0,459.0,444.5,5.0,0.6666666666666666
52
+ a1012a57-385e-45a9-8a59-694a26fe92a5__ep1:qa:23,test,a1012a57-385e-45a9-8a59-694a26fe92a5__ep1,460.0,479.0,460.0,479.0,469.5,0.0,1.0
53
+ a1012a57-385e-45a9-8a59-694a26fe92a5__ep1:qa:24,test,a1012a57-385e-45a9-8a59-694a26fe92a5__ep1,480.0,499.0,480.0,499.0,489.5,0.0,1.0
54
+ a1012a57-385e-45a9-8a59-694a26fe92a5__ep1:qa:25,test,a1012a57-385e-45a9-8a59-694a26fe92a5__ep1,500.0,519.0,493.0,519.0,506.0,3.5,0.7407407407407407
55
+ a1012a57-385e-45a9-8a59-694a26fe92a5__ep1:qa:26,test,a1012a57-385e-45a9-8a59-694a26fe92a5__ep1,520.0,539.0,,,,,0.0
56
+ a1012a57-385e-45a9-8a59-694a26fe92a5__ep1:qa:250,test,a1012a57-385e-45a9-8a59-694a26fe92a5__ep1,5000.0,5019.0,,,,,0.0
57
+ a1012a57-385e-45a9-8a59-694a26fe92a5__ep1:qa:251,test,a1012a57-385e-45a9-8a59-694a26fe92a5__ep1,5020.0,5039.0,,,,,0.0
58
+ a1012a57-385e-45a9-8a59-694a26fe92a5__ep1:qa:252,test,a1012a57-385e-45a9-8a59-694a26fe92a5__ep1,5040.0,5059.0,5040.0,5059.0,5049.5,0.0,1.0
59
+ a1012a57-385e-45a9-8a59-694a26fe92a5__ep1:qa:253,test,a1012a57-385e-45a9-8a59-694a26fe92a5__ep1,5060.0,5079.0,,,,,0.0
60
+ a1012a57-385e-45a9-8a59-694a26fe92a5__ep1:qa:254,test,a1012a57-385e-45a9-8a59-694a26fe92a5__ep1,5080.0,5099.0,,,,,0.0
61
+ a1012a57-385e-45a9-8a59-694a26fe92a5__ep1:qa:255,test,a1012a57-385e-45a9-8a59-694a26fe92a5__ep1,5100.0,5119.0,5090.0,5119.0,5104.5,5.0,0.6666666666666666
62
+ a1012a57-385e-45a9-8a59-694a26fe92a5__ep1:qa:256,test,a1012a57-385e-45a9-8a59-694a26fe92a5__ep1,5120.0,5139.0,5114.0,5139.0,5126.5,3.0,0.7692307692307693
63
+ a1012a57-385e-45a9-8a59-694a26fe92a5__ep1:qa:294,test,a1012a57-385e-45a9-8a59-694a26fe92a5__ep1,5880.0,5899.0,,,,,0.0
64
+ a1012a57-385e-45a9-8a59-694a26fe92a5__ep1:qa:295,test,a1012a57-385e-45a9-8a59-694a26fe92a5__ep1,5900.0,5919.0,,,,,0.0
65
+ a1012a57-385e-45a9-8a59-694a26fe92a5__ep1:qa:296,test,a1012a57-385e-45a9-8a59-694a26fe92a5__ep1,5920.0,5939.0,0.0,1.0,0.5,5929.0,0.0
66
+ 33f7ae08-ac1d-4321-9cb9-eca79016b359__ep1:qa:0,test,33f7ae08-ac1d-4321-9cb9-eca79016b359__ep1,0.0,19.0,0.0,1.0,0.5,9.0,0.1
67
+ 33f7ae08-ac1d-4321-9cb9-eca79016b359__ep1:qa:1,test,33f7ae08-ac1d-4321-9cb9-eca79016b359__ep1,20.0,39.0,,,,,0.0
68
+ 33f7ae08-ac1d-4321-9cb9-eca79016b359__ep1:qa:16,test,33f7ae08-ac1d-4321-9cb9-eca79016b359__ep1,320.0,339.0,0.0,1.0,0.5,329.0,0.0
69
+ 33f7ae08-ac1d-4321-9cb9-eca79016b359__ep1:qa:17,test,33f7ae08-ac1d-4321-9cb9-eca79016b359__ep1,340.0,359.0,0.0,1.0,0.5,349.0,0.0
70
+ 33f7ae08-ac1d-4321-9cb9-eca79016b359__ep1:qa:20,test,33f7ae08-ac1d-4321-9cb9-eca79016b359__ep1,400.0,419.0,380.0,419.0,399.5,10.0,0.5
71
+ 33f7ae08-ac1d-4321-9cb9-eca79016b359__ep1:qa:21,test,33f7ae08-ac1d-4321-9cb9-eca79016b359__ep1,420.0,439.0,,,,,0.0
72
+ 33f7ae08-ac1d-4321-9cb9-eca79016b359__ep1:qa:46,test,33f7ae08-ac1d-4321-9cb9-eca79016b359__ep1,920.0,939.0,,,,,0.0
73
+ 33f7ae08-ac1d-4321-9cb9-eca79016b359__ep1:qa:47,test,33f7ae08-ac1d-4321-9cb9-eca79016b359__ep1,940.0,959.0,,,,,0.0
74
+ 33f7ae08-ac1d-4321-9cb9-eca79016b359__ep1:qa:50,test,33f7ae08-ac1d-4321-9cb9-eca79016b359__ep1,1000.0,1019.0,0.0,1.0,0.5,1009.0,0.0
75
+ 33f7ae08-ac1d-4321-9cb9-eca79016b359__ep1:qa:58,test,33f7ae08-ac1d-4321-9cb9-eca79016b359__ep1,1160.0,1179.0,1160.0,1179.0,1169.5,0.0,1.0
76
+ 33f7ae08-ac1d-4321-9cb9-eca79016b359__ep1:qa:59,test,33f7ae08-ac1d-4321-9cb9-eca79016b359__ep1,1180.0,1199.0,0.0,0.0,0.0,1189.5,0.0
77
+ 33f7ae08-ac1d-4321-9cb9-eca79016b359__ep1:qa:64,test,33f7ae08-ac1d-4321-9cb9-eca79016b359__ep1,1280.0,1299.0,1280.0,1299.0,1289.5,0.0,1.0
78
+ 33f7ae08-ac1d-4321-9cb9-eca79016b359__ep1:qa:65,test,33f7ae08-ac1d-4321-9cb9-eca79016b359__ep1,1300.0,1319.0,1300.0,1319.0,1309.5,0.0,1.0
79
+ 33f7ae08-ac1d-4321-9cb9-eca79016b359__ep1:qa:70,test,33f7ae08-ac1d-4321-9cb9-eca79016b359__ep1,1400.0,1419.0,1398.0,1419.0,1408.5,1.0,0.9090909090909091
80
+ 33f7ae08-ac1d-4321-9cb9-eca79016b359__ep1:qa:76,test,33f7ae08-ac1d-4321-9cb9-eca79016b359__ep1,1520.0,1539.0,1520.0,1539.0,1529.5,0.0,1.0
81
+ 33f7ae08-ac1d-4321-9cb9-eca79016b359__ep1:qa:77,test,33f7ae08-ac1d-4321-9cb9-eca79016b359__ep1,1540.0,1559.0,,,,,0.0
82
+ 33f7ae08-ac1d-4321-9cb9-eca79016b359__ep1:qa:100,test,33f7ae08-ac1d-4321-9cb9-eca79016b359__ep1,2000.0,2019.0,1965.0,2019.0,1992.0,17.5,0.36363636363636365
83
+ 33f7ae08-ac1d-4321-9cb9-eca79016b359__ep1:qa:101,test,33f7ae08-ac1d-4321-9cb9-eca79016b359__ep1,2020.0,2039.0,0.0,1.0,0.5,2029.0,0.0
84
+ 33f7ae08-ac1d-4321-9cb9-eca79016b359__ep1:qa:126,test,33f7ae08-ac1d-4321-9cb9-eca79016b359__ep1,2520.0,2539.0,2518.0,2539.0,2528.5,1.0,0.9090909090909091
85
+ 33f7ae08-ac1d-4321-9cb9-eca79016b359__ep1:qa:138,test,33f7ae08-ac1d-4321-9cb9-eca79016b359__ep1,2760.0,2779.0,0.0,1.0,0.5,2769.0,0.0
86
+ 33f7ae08-ac1d-4321-9cb9-eca79016b359__ep1:qa:140,test,33f7ae08-ac1d-4321-9cb9-eca79016b359__ep1,2800.0,2819.0,0.0,19.0,9.5,2800.0,0.0
87
+ 33f7ae08-ac1d-4321-9cb9-eca79016b359__ep1:qa:141,test,33f7ae08-ac1d-4321-9cb9-eca79016b359__ep1,2820.0,2839.0,2820.0,2839.0,2829.5,0.0,1.0
88
+ 33f7ae08-ac1d-4321-9cb9-eca79016b359__ep1:qa:150,test,33f7ae08-ac1d-4321-9cb9-eca79016b359__ep1,3000.0,3019.0,3000.0,3019.0,3009.5,0.0,1.0
89
+ 33f7ae08-ac1d-4321-9cb9-eca79016b359__ep1:qa:151,test,33f7ae08-ac1d-4321-9cb9-eca79016b359__ep1,3020.0,3039.0,3020.0,3039.0,3029.5,0.0,1.0
90
+ 33f7ae08-ac1d-4321-9cb9-eca79016b359__ep1:qa:164,test,33f7ae08-ac1d-4321-9cb9-eca79016b359__ep1,3280.0,3299.0,3280.0,3299.0,3289.5,0.0,1.0
91
+ 33f7ae08-ac1d-4321-9cb9-eca79016b359__ep1:qa:165,test,33f7ae08-ac1d-4321-9cb9-eca79016b359__ep1,3300.0,3319.0,0.0,19.0,9.5,3300.0,0.0
92
+ 33f7ae08-ac1d-4321-9cb9-eca79016b359__ep1:qa:172,test,33f7ae08-ac1d-4321-9cb9-eca79016b359__ep1,3440.0,3459.0,3380.0,3459.0,3419.5,30.0,0.25
93
+ 33f7ae08-ac1d-4321-9cb9-eca79016b359__ep1:qa:173,test,33f7ae08-ac1d-4321-9cb9-eca79016b359__ep1,3460.0,3479.0,3460.0,3479.0,3469.5,0.0,1.0
94
+ 33f7ae08-ac1d-4321-9cb9-eca79016b359__ep1:qa:182,test,33f7ae08-ac1d-4321-9cb9-eca79016b359__ep1,3640.0,3659.0,3639.0,3659.0,3649.0,0.5,0.9523809523809523
95
+ 33f7ae08-ac1d-4321-9cb9-eca79016b359__ep1:qa:183,test,33f7ae08-ac1d-4321-9cb9-eca79016b359__ep1,3660.0,3679.0,3660.0,3679.0,3669.5,0.0,1.0
96
+ 33f7ae08-ac1d-4321-9cb9-eca79016b359__ep1:qa:226,test,33f7ae08-ac1d-4321-9cb9-eca79016b359__ep1,4520.0,4539.0,4518.0,4539.0,4528.5,1.0,0.9090909090909091
97
+ 33f7ae08-ac1d-4321-9cb9-eca79016b359__ep1:qa:244,test,33f7ae08-ac1d-4321-9cb9-eca79016b359__ep1,4880.0,4899.0,4880.0,4899.0,4889.5,0.0,1.0
98
+ 9c553886-83c5-4dc4-be5c-dcb269b3a771__ep2:qa:0,test,9c553886-83c5-4dc4-be5c-dcb269b3a771__ep2,0.0,19.0,,,,,0.0
99
+ 9c553886-83c5-4dc4-be5c-dcb269b3a771__ep2:qa:1,test,9c553886-83c5-4dc4-be5c-dcb269b3a771__ep2,20.0,39.0,,,,,0.0
100
+ 9c553886-83c5-4dc4-be5c-dcb269b3a771__ep2:qa:2,test,9c553886-83c5-4dc4-be5c-dcb269b3a771__ep2,40.0,59.0,,,,,0.0
101
+ 9c553886-83c5-4dc4-be5c-dcb269b3a771__ep2:qa:26,test,9c553886-83c5-4dc4-be5c-dcb269b3a771__ep2,520.0,539.0,,,,,0.0
102
+ 9c553886-83c5-4dc4-be5c-dcb269b3a771__ep2:qa:27,test,9c553886-83c5-4dc4-be5c-dcb269b3a771__ep2,540.0,559.0,,,,,0.0
103
+ 9c553886-83c5-4dc4-be5c-dcb269b3a771__ep2:qa:30,test,9c553886-83c5-4dc4-be5c-dcb269b3a771__ep2,600.0,619.0,,,,,0.0
104
+ 9c553886-83c5-4dc4-be5c-dcb269b3a771__ep2:qa:31,test,9c553886-83c5-4dc4-be5c-dcb269b3a771__ep2,620.0,639.0,,,,,0.0
105
+ 9c553886-83c5-4dc4-be5c-dcb269b3a771__ep2:qa:70,test,9c553886-83c5-4dc4-be5c-dcb269b3a771__ep2,1400.0,1419.0,,,,,0.0
106
+ 9c553886-83c5-4dc4-be5c-dcb269b3a771__ep2:qa:71,test,9c553886-83c5-4dc4-be5c-dcb269b3a771__ep2,1420.0,1439.0,,,,,0.0
107
+ 9c553886-83c5-4dc4-be5c-dcb269b3a771__ep2:qa:72,test,9c553886-83c5-4dc4-be5c-dcb269b3a771__ep2,1440.0,1459.0,,,,,0.0
108
+ 9c553886-83c5-4dc4-be5c-dcb269b3a771__ep2:qa:90,test,9c553886-83c5-4dc4-be5c-dcb269b3a771__ep2,1800.0,1819.0,,,,,0.0
109
+ 9c553886-83c5-4dc4-be5c-dcb269b3a771__ep2:qa:91,test,9c553886-83c5-4dc4-be5c-dcb269b3a771__ep2,1820.0,1839.0,,,,,0.0
110
+ 9c553886-83c5-4dc4-be5c-dcb269b3a771__ep2:qa:110,test,9c553886-83c5-4dc4-be5c-dcb269b3a771__ep2,2200.0,2219.0,2194.0,2219.0,2206.5,3.0,0.7692307692307693
111
+ 9c553886-83c5-4dc4-be5c-dcb269b3a771__ep2:qa:111,test,9c553886-83c5-4dc4-be5c-dcb269b3a771__ep2,2220.0,2239.0,2220.0,2239.0,2229.5,0.0,1.0
112
+ 9c553886-83c5-4dc4-be5c-dcb269b3a771__ep2:qa:112,test,9c553886-83c5-4dc4-be5c-dcb269b3a771__ep2,2240.0,2259.0,2240.0,2259.0,2249.5,0.0,1.0
113
+ 9c553886-83c5-4dc4-be5c-dcb269b3a771__ep2:qa:170,test,9c553886-83c5-4dc4-be5c-dcb269b3a771__ep2,3400.0,3419.0,,,,,0.0
114
+ 9c553886-83c5-4dc4-be5c-dcb269b3a771__ep2:qa:171,test,9c553886-83c5-4dc4-be5c-dcb269b3a771__ep2,3420.0,3439.0,,,,,0.0
115
+ 9c553886-83c5-4dc4-be5c-dcb269b3a771__ep2:qa:172,test,9c553886-83c5-4dc4-be5c-dcb269b3a771__ep2,3440.0,3459.0,,,,,0.0
116
+ 9c553886-83c5-4dc4-be5c-dcb269b3a771__ep2:qa:230,test,9c553886-83c5-4dc4-be5c-dcb269b3a771__ep2,4600.0,4619.0,,,,,0.0
117
+ 9c553886-83c5-4dc4-be5c-dcb269b3a771__ep2:qa:231,test,9c553886-83c5-4dc4-be5c-dcb269b3a771__ep2,4620.0,4639.0,,,,,0.0
118
+ 9c553886-83c5-4dc4-be5c-dcb269b3a771__ep2:qa:276,test,9c553886-83c5-4dc4-be5c-dcb269b3a771__ep2,5520.0,5539.0,,,,,0.0
119
+ 9c553886-83c5-4dc4-be5c-dcb269b3a771__ep2:qa:277,test,9c553886-83c5-4dc4-be5c-dcb269b3a771__ep2,5540.0,5559.0,,,,,0.0
120
+ 9c553886-83c5-4dc4-be5c-dcb269b3a771__ep2:qa:278,test,9c553886-83c5-4dc4-be5c-dcb269b3a771__ep2,5560.0,5579.0,,,,,0.0
121
+ 9c553886-83c5-4dc4-be5c-dcb269b3a771__ep2:qa:282,test,9c553886-83c5-4dc4-be5c-dcb269b3a771__ep2,5640.0,5659.0,,,,,0.0
122
+ 9c553886-83c5-4dc4-be5c-dcb269b3a771__ep2:qa:283,test,9c553886-83c5-4dc4-be5c-dcb269b3a771__ep2,5660.0,5679.0,,,,,0.0
123
+ 9c553886-83c5-4dc4-be5c-dcb269b3a771__ep2:qa:284,test,9c553886-83c5-4dc4-be5c-dcb269b3a771__ep2,5680.0,5699.0,,,,,0.0
124
+ 9c553886-83c5-4dc4-be5c-dcb269b3a771__ep2:qa:290,test,9c553886-83c5-4dc4-be5c-dcb269b3a771__ep2,5800.0,5819.0,,,,,0.0
125
+ 9c553886-83c5-4dc4-be5c-dcb269b3a771__ep2:qa:291,test,9c553886-83c5-4dc4-be5c-dcb269b3a771__ep2,5820.0,5839.0,,,,,0.0
126
+ 9c553886-83c5-4dc4-be5c-dcb269b3a771__ep2:qa:292,test,9c553886-83c5-4dc4-be5c-dcb269b3a771__ep2,5840.0,5859.0,,,,,0.0
127
+ 9c553886-83c5-4dc4-be5c-dcb269b3a771__ep2:qa:293,test,9c553886-83c5-4dc4-be5c-dcb269b3a771__ep2,5860.0,5879.0,,,,,0.0
128
+ 9c553886-83c5-4dc4-be5c-dcb269b3a771__ep2:qa:294,test,9c553886-83c5-4dc4-be5c-dcb269b3a771__ep2,5880.0,5899.0,,,,,0.0
129
+ 9c553886-83c5-4dc4-be5c-dcb269b3a771__ep2:qa:295,test,9c553886-83c5-4dc4-be5c-dcb269b3a771__ep2,5900.0,5919.0,,,,,0.0
130
+ 34f07a04-eb37-45a3-95ec-189ed5f4a85b__ep5:qa:0,test,34f07a04-eb37-45a3-95ec-189ed5f4a85b__ep5,0.0,19.0,0.0,19.0,9.5,0.0,1.0
131
+ 34f07a04-eb37-45a3-95ec-189ed5f4a85b__ep5:qa:12,test,34f07a04-eb37-45a3-95ec-189ed5f4a85b__ep5,240.0,259.0,240.0,259.0,249.5,0.0,1.0
132
+ 34f07a04-eb37-45a3-95ec-189ed5f4a85b__ep5:qa:64,test,34f07a04-eb37-45a3-95ec-189ed5f4a85b__ep5,1280.0,1299.0,1280.0,1299.0,1289.5,0.0,1.0
133
+ 34f07a04-eb37-45a3-95ec-189ed5f4a85b__ep5:qa:65,test,34f07a04-eb37-45a3-95ec-189ed5f4a85b__ep5,1300.0,1319.0,1300.0,1319.0,1309.5,0.0,1.0
134
+ 34f07a04-eb37-45a3-95ec-189ed5f4a85b__ep5:qa:70,test,34f07a04-eb37-45a3-95ec-189ed5f4a85b__ep5,1400.0,1419.0,1395.0,1419.0,1407.0,2.5,0.8
135
+ 34f07a04-eb37-45a3-95ec-189ed5f4a85b__ep5:qa:71,test,34f07a04-eb37-45a3-95ec-189ed5f4a85b__ep5,1420.0,1439.0,1420.0,1439.0,1429.5,0.0,1.0
136
+ 34f07a04-eb37-45a3-95ec-189ed5f4a85b__ep5:qa:82,test,34f07a04-eb37-45a3-95ec-189ed5f4a85b__ep5,1640.0,1659.0,1640.0,1659.0,1649.5,0.0,1.0
137
+ 34f07a04-eb37-45a3-95ec-189ed5f4a85b__ep5:qa:90,test,34f07a04-eb37-45a3-95ec-189ed5f4a85b__ep5,1800.0,1819.0,1796.0,1819.0,1807.5,2.0,0.8333333333333334
138
+ 34f07a04-eb37-45a3-95ec-189ed5f4a85b__ep5:qa:91,test,34f07a04-eb37-45a3-95ec-189ed5f4a85b__ep5,1820.0,1839.0,1820.0,1839.0,1829.5,0.0,1.0
139
+ 34f07a04-eb37-45a3-95ec-189ed5f4a85b__ep5:qa:106,test,34f07a04-eb37-45a3-95ec-189ed5f4a85b__ep5,2120.0,2139.0,2120.0,2139.0,2129.5,0.0,1.0
140
+ 34f07a04-eb37-45a3-95ec-189ed5f4a85b__ep5:qa:140,test,34f07a04-eb37-45a3-95ec-189ed5f4a85b__ep5,2800.0,2819.0,2698.0,2819.0,2758.5,51.0,0.16393442622950818
141
+ 34f07a04-eb37-45a3-95ec-189ed5f4a85b__ep5:qa:141,test,34f07a04-eb37-45a3-95ec-189ed5f4a85b__ep5,2820.0,2839.0,2816.0,2839.0,2827.5,2.0,0.8333333333333334
142
+ 34f07a04-eb37-45a3-95ec-189ed5f4a85b__ep5:qa:154,test,34f07a04-eb37-45a3-95ec-189ed5f4a85b__ep5,3080.0,3099.0,3080.0,3099.0,3089.5,0.0,1.0
143
+ 34f07a04-eb37-45a3-95ec-189ed5f4a85b__ep5:qa:160,test,34f07a04-eb37-45a3-95ec-189ed5f4a85b__ep5,3200.0,3219.0,0.0,19.0,9.5,3200.0,0.0
144
+ 34f07a04-eb37-45a3-95ec-189ed5f4a85b__ep5:qa:166,test,34f07a04-eb37-45a3-95ec-189ed5f4a85b__ep5,3320.0,3339.0,3320.0,3339.0,3329.5,0.0,1.0
145
+ 34f07a04-eb37-45a3-95ec-189ed5f4a85b__ep5:qa:167,test,34f07a04-eb37-45a3-95ec-189ed5f4a85b__ep5,3340.0,3359.0,3340.0,3359.0,3349.5,0.0,1.0
146
+ 34f07a04-eb37-45a3-95ec-189ed5f4a85b__ep5:qa:190,test,34f07a04-eb37-45a3-95ec-189ed5f4a85b__ep5,3800.0,3819.0,3795.0,3819.0,3807.0,2.5,0.8
147
+ 34f07a04-eb37-45a3-95ec-189ed5f4a85b__ep5:qa:191,test,34f07a04-eb37-45a3-95ec-189ed5f4a85b__ep5,3820.0,3839.0,3819.0,3839.0,3829.0,0.5,0.9523809523809523
148
+ 34f07a04-eb37-45a3-95ec-189ed5f4a85b__ep5:qa:198,test,34f07a04-eb37-45a3-95ec-189ed5f4a85b__ep5,3960.0,3979.0,3960.0,3979.0,3969.5,0.0,1.0
149
+ 34f07a04-eb37-45a3-95ec-189ed5f4a85b__ep5:qa:199,test,34f07a04-eb37-45a3-95ec-189ed5f4a85b__ep5,3980.0,3999.0,3980.0,3999.0,3989.5,0.0,1.0
150
+ 34f07a04-eb37-45a3-95ec-189ed5f4a85b__ep5:qa:206,test,34f07a04-eb37-45a3-95ec-189ed5f4a85b__ep5,4120.0,4139.0,4116.0,4139.0,4127.5,2.0,0.8333333333333334
151
+ 34f07a04-eb37-45a3-95ec-189ed5f4a85b__ep5:qa:207,test,34f07a04-eb37-45a3-95ec-189ed5f4a85b__ep5,4140.0,4159.0,4140.0,4159.0,4149.5,0.0,1.0
152
+ 34f07a04-eb37-45a3-95ec-189ed5f4a85b__ep5:qa:218,test,34f07a04-eb37-45a3-95ec-189ed5f4a85b__ep5,4360.0,4379.0,,,,,0.0
153
+ 34f07a04-eb37-45a3-95ec-189ed5f4a85b__ep5:qa:219,test,34f07a04-eb37-45a3-95ec-189ed5f4a85b__ep5,4380.0,4399.0,4380.0,4399.0,4389.5,0.0,1.0
154
+ 34f07a04-eb37-45a3-95ec-189ed5f4a85b__ep5:qa:220,test,34f07a04-eb37-45a3-95ec-189ed5f4a85b__ep5,4400.0,4419.0,,,,,0.0
155
+ 34f07a04-eb37-45a3-95ec-189ed5f4a85b__ep5:qa:221,test,34f07a04-eb37-45a3-95ec-189ed5f4a85b__ep5,4420.0,4439.0,4420.0,4439.0,4429.5,0.0,1.0
156
+ 34f07a04-eb37-45a3-95ec-189ed5f4a85b__ep5:qa:236,test,34f07a04-eb37-45a3-95ec-189ed5f4a85b__ep5,4720.0,4739.0,,,,,0.0
157
+ 34f07a04-eb37-45a3-95ec-189ed5f4a85b__ep5:qa:237,test,34f07a04-eb37-45a3-95ec-189ed5f4a85b__ep5,4740.0,4759.0,4740.0,4759.0,4749.5,0.0,1.0
158
+ 34f07a04-eb37-45a3-95ec-189ed5f4a85b__ep5:qa:240,test,34f07a04-eb37-45a3-95ec-189ed5f4a85b__ep5,4800.0,4819.0,4799.0,4819.0,4809.0,0.5,0.9523809523809523
159
+ 34f07a04-eb37-45a3-95ec-189ed5f4a85b__ep5:qa:241,test,34f07a04-eb37-45a3-95ec-189ed5f4a85b__ep5,4820.0,4839.0,0.0,1.0,0.5,4829.0,0.0
160
+ 34f07a04-eb37-45a3-95ec-189ed5f4a85b__ep5:qa:244,test,34f07a04-eb37-45a3-95ec-189ed5f4a85b__ep5,4880.0,4899.0,4880.0,4899.0,4889.5,0.0,1.0
161
+ 34f07a04-eb37-45a3-95ec-189ed5f4a85b__ep5:qa:245,test,34f07a04-eb37-45a3-95ec-189ed5f4a85b__ep5,4900.0,4919.0,0.0,19.0,9.5,4900.0,0.0
162
+ b9dd769b-e31a-4fdb-945e-5a60db6487b0__ep2:qa:0,test,b9dd769b-e31a-4fdb-945e-5a60db6487b0__ep2,0.0,19.0,0.0,1.0,0.5,9.0,0.1
163
+ b9dd769b-e31a-4fdb-945e-5a60db6487b0__ep2:qa:1,test,b9dd769b-e31a-4fdb-945e-5a60db6487b0__ep2,20.0,39.0,,,,,0.0
164
+ b9dd769b-e31a-4fdb-945e-5a60db6487b0__ep2:qa:2,test,b9dd769b-e31a-4fdb-945e-5a60db6487b0__ep2,40.0,59.0,,,,,0.0
165
+ b9dd769b-e31a-4fdb-945e-5a60db6487b0__ep2:qa:40,test,b9dd769b-e31a-4fdb-945e-5a60db6487b0__ep2,800.0,819.0,782.0,819.0,800.5,9.0,0.5263157894736842
166
+ b9dd769b-e31a-4fdb-945e-5a60db6487b0__ep2:qa:41,test,b9dd769b-e31a-4fdb-945e-5a60db6487b0__ep2,820.0,839.0,,,,,0.0
167
+ b9dd769b-e31a-4fdb-945e-5a60db6487b0__ep2:qa:42,test,b9dd769b-e31a-4fdb-945e-5a60db6487b0__ep2,840.0,859.0,840.0,859.0,849.5,0.0,1.0
168
+ b9dd769b-e31a-4fdb-945e-5a60db6487b0__ep2:qa:43,test,b9dd769b-e31a-4fdb-945e-5a60db6487b0__ep2,860.0,879.0,,,,,0.0
169
+ b9dd769b-e31a-4fdb-945e-5a60db6487b0__ep2:qa:70,test,b9dd769b-e31a-4fdb-945e-5a60db6487b0__ep2,1400.0,1419.0,,,,,0.0
170
+ b9dd769b-e31a-4fdb-945e-5a60db6487b0__ep2:qa:71,test,b9dd769b-e31a-4fdb-945e-5a60db6487b0__ep2,1420.0,1439.0,,,,,0.0
171
+ b9dd769b-e31a-4fdb-945e-5a60db6487b0__ep2:qa:72,test,b9dd769b-e31a-4fdb-945e-5a60db6487b0__ep2,1440.0,1459.0,,,,,0.0
172
+ b9dd769b-e31a-4fdb-945e-5a60db6487b0__ep2:qa:73,test,b9dd769b-e31a-4fdb-945e-5a60db6487b0__ep2,1460.0,1479.0,,,,,0.0
173
+ b9dd769b-e31a-4fdb-945e-5a60db6487b0__ep2:qa:90,test,b9dd769b-e31a-4fdb-945e-5a60db6487b0__ep2,1800.0,1819.0,,,,,0.0
174
+ b9dd769b-e31a-4fdb-945e-5a60db6487b0__ep2:qa:91,test,b9dd769b-e31a-4fdb-945e-5a60db6487b0__ep2,1820.0,1839.0,,,,,0.0
175
+ b9dd769b-e31a-4fdb-945e-5a60db6487b0__ep2:qa:92,test,b9dd769b-e31a-4fdb-945e-5a60db6487b0__ep2,1840.0,1859.0,,,,,0.0
176
+ b9dd769b-e31a-4fdb-945e-5a60db6487b0__ep2:qa:94,test,b9dd769b-e31a-4fdb-945e-5a60db6487b0__ep2,1880.0,1899.0,0.0,1.0,0.5,1889.0,0.0
177
+ b9dd769b-e31a-4fdb-945e-5a60db6487b0__ep2:qa:95,test,b9dd769b-e31a-4fdb-945e-5a60db6487b0__ep2,1900.0,1919.0,,,,,0.0
178
+ b9dd769b-e31a-4fdb-945e-5a60db6487b0__ep2:qa:96,test,b9dd769b-e31a-4fdb-945e-5a60db6487b0__ep2,1920.0,1939.0,1920.0,1939.0,1929.5,0.0,1.0
179
+ b9dd769b-e31a-4fdb-945e-5a60db6487b0__ep2:qa:97,test,b9dd769b-e31a-4fdb-945e-5a60db6487b0__ep2,1940.0,1959.0,0.0,1.0,0.5,1949.0,0.0
180
+ b9dd769b-e31a-4fdb-945e-5a60db6487b0__ep2:qa:114,test,b9dd769b-e31a-4fdb-945e-5a60db6487b0__ep2,2280.0,2299.0,2280.0,2299.0,2289.5,0.0,1.0
181
+ b9dd769b-e31a-4fdb-945e-5a60db6487b0__ep2:qa:115,test,b9dd769b-e31a-4fdb-945e-5a60db6487b0__ep2,2300.0,2319.0,,,,,0.0
182
+ b9dd769b-e31a-4fdb-945e-5a60db6487b0__ep2:qa:116,test,b9dd769b-e31a-4fdb-945e-5a60db6487b0__ep2,2320.0,2339.0,,,,,0.0
183
+ b9dd769b-e31a-4fdb-945e-5a60db6487b0__ep2:qa:120,test,b9dd769b-e31a-4fdb-945e-5a60db6487b0__ep2,2400.0,2419.0,,,,,0.0
184
+ b9dd769b-e31a-4fdb-945e-5a60db6487b0__ep2:qa:121,test,b9dd769b-e31a-4fdb-945e-5a60db6487b0__ep2,2420.0,2439.0,2390.0,2439.0,2414.5,15.0,0.4
185
+ b9dd769b-e31a-4fdb-945e-5a60db6487b0__ep2:qa:122,test,b9dd769b-e31a-4fdb-945e-5a60db6487b0__ep2,2440.0,2459.0,,,,,0.0
186
+ b9dd769b-e31a-4fdb-945e-5a60db6487b0__ep2:qa:123,test,b9dd769b-e31a-4fdb-945e-5a60db6487b0__ep2,2460.0,2479.0,,,,,0.0
187
+ b9dd769b-e31a-4fdb-945e-5a60db6487b0__ep2:qa:144,test,b9dd769b-e31a-4fdb-945e-5a60db6487b0__ep2,2880.0,2899.0,,,,,0.0
188
+ b9dd769b-e31a-4fdb-945e-5a60db6487b0__ep2:qa:145,test,b9dd769b-e31a-4fdb-945e-5a60db6487b0__ep2,2900.0,2919.0,,,,,0.0
189
+ b9dd769b-e31a-4fdb-945e-5a60db6487b0__ep2:qa:146,test,b9dd769b-e31a-4fdb-945e-5a60db6487b0__ep2,2920.0,2939.0,,,,,0.0
190
+ b9dd769b-e31a-4fdb-945e-5a60db6487b0__ep2:qa:147,test,b9dd769b-e31a-4fdb-945e-5a60db6487b0__ep2,2940.0,2959.0,,,,,0.0
191
+ b9dd769b-e31a-4fdb-945e-5a60db6487b0__ep2:qa:190,test,b9dd769b-e31a-4fdb-945e-5a60db6487b0__ep2,3800.0,3819.0,,,,,0.0
192
+ b9dd769b-e31a-4fdb-945e-5a60db6487b0__ep2:qa:191,test,b9dd769b-e31a-4fdb-945e-5a60db6487b0__ep2,3820.0,3839.0,3820.0,3839.0,3829.5,0.0,1.0
193
+ b9dd769b-e31a-4fdb-945e-5a60db6487b0__ep2:qa:192,test,b9dd769b-e31a-4fdb-945e-5a60db6487b0__ep2,3840.0,3859.0,,,,,0.0
194
+ ba045ed4-ef25-404d-b756-8dcbd45b18fa__ep2:qa:0,test,ba045ed4-ef25-404d-b756-8dcbd45b18fa__ep2,0.0,19.0,,,,,0.0
195
+ ba045ed4-ef25-404d-b756-8dcbd45b18fa__ep2:qa:1,test,ba045ed4-ef25-404d-b756-8dcbd45b18fa__ep2,20.0,39.0,,,,,0.0
196
+ ba045ed4-ef25-404d-b756-8dcbd45b18fa__ep2:qa:20,test,ba045ed4-ef25-404d-b756-8dcbd45b18fa__ep2,400.0,419.0,400.0,419.0,409.5,0.0,1.0
197
+ ba045ed4-ef25-404d-b756-8dcbd45b18fa__ep2:qa:21,test,ba045ed4-ef25-404d-b756-8dcbd45b18fa__ep2,420.0,439.0,0.0,1.0,0.5,429.0,0.0
198
+ ba045ed4-ef25-404d-b756-8dcbd45b18fa__ep2:qa:30,test,ba045ed4-ef25-404d-b756-8dcbd45b18fa__ep2,600.0,619.0,,,,,0.0
199
+ ba045ed4-ef25-404d-b756-8dcbd45b18fa__ep2:qa:31,test,ba045ed4-ef25-404d-b756-8dcbd45b18fa__ep2,620.0,639.0,,,,,0.0
200
+ ba045ed4-ef25-404d-b756-8dcbd45b18fa__ep2:qa:40,test,ba045ed4-ef25-404d-b756-8dcbd45b18fa__ep2,800.0,819.0,,,,,0.0
201
+ ba045ed4-ef25-404d-b756-8dcbd45b18fa__ep2:qa:41,test,ba045ed4-ef25-404d-b756-8dcbd45b18fa__ep2,820.0,839.0,0.0,1.0,0.5,829.0,0.0
202
+ ba045ed4-ef25-404d-b756-8dcbd45b18fa__ep2:qa:70,test,ba045ed4-ef25-404d-b756-8dcbd45b18fa__ep2,1400.0,1419.0,1380.0,1419.0,1399.5,10.0,0.5
203
+ ba045ed4-ef25-404d-b756-8dcbd45b18fa__ep2:qa:71,test,ba045ed4-ef25-404d-b756-8dcbd45b18fa__ep2,1420.0,1439.0,1420.0,1439.0,1429.5,0.0,1.0
204
+ ba045ed4-ef25-404d-b756-8dcbd45b18fa__ep2:qa:170,test,ba045ed4-ef25-404d-b756-8dcbd45b18fa__ep2,3400.0,3419.0,,,,,0.0
205
+ ba045ed4-ef25-404d-b756-8dcbd45b18fa__ep2:qa:171,test,ba045ed4-ef25-404d-b756-8dcbd45b18fa__ep2,3420.0,3439.0,3420.0,3439.0,3429.5,0.0,1.0
206
+ ba045ed4-ef25-404d-b756-8dcbd45b18fa__ep2:qa:176,test,ba045ed4-ef25-404d-b756-8dcbd45b18fa__ep2,3520.0,3539.0,,,,,0.0
207
+ ba045ed4-ef25-404d-b756-8dcbd45b18fa__ep2:qa:182,test,ba045ed4-ef25-404d-b756-8dcbd45b18fa__ep2,3640.0,3659.0,0.0,1.0,0.5,3649.0,0.0
208
+ ba045ed4-ef25-404d-b756-8dcbd45b18fa__ep2:qa:190,test,ba045ed4-ef25-404d-b756-8dcbd45b18fa__ep2,3800.0,3819.0,0.0,1.0,0.5,3809.0,0.0
209
+ ba045ed4-ef25-404d-b756-8dcbd45b18fa__ep2:qa:191,test,ba045ed4-ef25-404d-b756-8dcbd45b18fa__ep2,3820.0,3839.0,0.0,1.0,0.5,3829.0,0.0
210
+ ba045ed4-ef25-404d-b756-8dcbd45b18fa__ep2:qa:200,test,ba045ed4-ef25-404d-b756-8dcbd45b18fa__ep2,4000.0,4019.0,,,,,0.0
211
+ ba045ed4-ef25-404d-b756-8dcbd45b18fa__ep2:qa:201,test,ba045ed4-ef25-404d-b756-8dcbd45b18fa__ep2,4020.0,4039.0,,,,,0.0
212
+ ba045ed4-ef25-404d-b756-8dcbd45b18fa__ep2:qa:214,test,ba045ed4-ef25-404d-b756-8dcbd45b18fa__ep2,4280.0,4299.0,,,,,0.0
213
+ ba045ed4-ef25-404d-b756-8dcbd45b18fa__ep2:qa:215,test,ba045ed4-ef25-404d-b756-8dcbd45b18fa__ep2,4300.0,4319.0,4285.0,4319.0,4302.0,7.5,0.5714285714285714
214
+ ba045ed4-ef25-404d-b756-8dcbd45b18fa__ep2:qa:220,test,ba045ed4-ef25-404d-b756-8dcbd45b18fa__ep2,4400.0,4419.0,4399.0,4419.0,4409.0,0.5,0.9523809523809523
215
+ ba045ed4-ef25-404d-b756-8dcbd45b18fa__ep2:qa:221,test,ba045ed4-ef25-404d-b756-8dcbd45b18fa__ep2,4420.0,4439.0,,,,,0.0
216
+ ba045ed4-ef25-404d-b756-8dcbd45b18fa__ep2:qa:230,test,ba045ed4-ef25-404d-b756-8dcbd45b18fa__ep2,4600.0,4619.0,,,,,0.0
217
+ ba045ed4-ef25-404d-b756-8dcbd45b18fa__ep2:qa:231,test,ba045ed4-ef25-404d-b756-8dcbd45b18fa__ep2,4620.0,4639.0,,,,,0.0
218
+ ba045ed4-ef25-404d-b756-8dcbd45b18fa__ep2:qa:240,test,ba045ed4-ef25-404d-b756-8dcbd45b18fa__ep2,4800.0,4819.0,,,,,0.0
219
+ ba045ed4-ef25-404d-b756-8dcbd45b18fa__ep2:qa:250,test,ba045ed4-ef25-404d-b756-8dcbd45b18fa__ep2,5000.0,5019.0,,,,,0.0
220
+ ba045ed4-ef25-404d-b756-8dcbd45b18fa__ep2:qa:258,test,ba045ed4-ef25-404d-b756-8dcbd45b18fa__ep2,5160.0,5179.0,0.0,1.0,0.5,5169.0,0.0
221
+ ba045ed4-ef25-404d-b756-8dcbd45b18fa__ep2:qa:259,test,ba045ed4-ef25-404d-b756-8dcbd45b18fa__ep2,5180.0,5199.0,,,,,0.0
222
+ ba045ed4-ef25-404d-b756-8dcbd45b18fa__ep2:qa:270,test,ba045ed4-ef25-404d-b756-8dcbd45b18fa__ep2,5400.0,5419.0,5400.0,5419.0,5409.5,0.0,1.0
223
+ ba045ed4-ef25-404d-b756-8dcbd45b18fa__ep2:qa:271,test,ba045ed4-ef25-404d-b756-8dcbd45b18fa__ep2,5420.0,5439.0,,,,,0.0
224
+ ba045ed4-ef25-404d-b756-8dcbd45b18fa__ep2:qa:290,test,ba045ed4-ef25-404d-b756-8dcbd45b18fa__ep2,5800.0,5819.0,5785.0,5819.0,5802.0,7.5,0.5714285714285714
225
+ ba045ed4-ef25-404d-b756-8dcbd45b18fa__ep2:qa:291,test,ba045ed4-ef25-404d-b756-8dcbd45b18fa__ep2,5820.0,5839.0,,,,,0.0
226
+ 4b02bb38-384a-438a-b5f9-6131d85c34b0__ep1:qa:0,test,4b02bb38-384a-438a-b5f9-6131d85c34b0__ep1,0.0,19.0,0.0,2.0,1.0,8.5,0.15
227
+ 4b02bb38-384a-438a-b5f9-6131d85c34b0__ep1:qa:1,test,4b02bb38-384a-438a-b5f9-6131d85c34b0__ep1,20.0,39.0,0.0,1.0,0.5,29.0,0.0
228
+ 4b02bb38-384a-438a-b5f9-6131d85c34b0__ep1:qa:2,test,4b02bb38-384a-438a-b5f9-6131d85c34b0__ep1,40.0,59.0,,,,,0.0
229
+ 4b02bb38-384a-438a-b5f9-6131d85c34b0__ep1:qa:14,test,4b02bb38-384a-438a-b5f9-6131d85c34b0__ep1,280.0,299.0,,,,,0.0
230
+ 4b02bb38-384a-438a-b5f9-6131d85c34b0__ep1:qa:15,test,4b02bb38-384a-438a-b5f9-6131d85c34b0__ep1,300.0,319.0,,,,,0.0
231
+ 4b02bb38-384a-438a-b5f9-6131d85c34b0__ep1:qa:16,test,4b02bb38-384a-438a-b5f9-6131d85c34b0__ep1,320.0,339.0,320.0,339.0,329.5,0.0,1.0
232
+ 4b02bb38-384a-438a-b5f9-6131d85c34b0__ep1:qa:20,test,4b02bb38-384a-438a-b5f9-6131d85c34b0__ep1,400.0,419.0,380.0,419.0,399.5,10.0,0.5
233
+ 4b02bb38-384a-438a-b5f9-6131d85c34b0__ep1:qa:21,test,4b02bb38-384a-438a-b5f9-6131d85c34b0__ep1,420.0,439.0,,,,,0.0
234
+ 4b02bb38-384a-438a-b5f9-6131d85c34b0__ep1:qa:22,test,4b02bb38-384a-438a-b5f9-6131d85c34b0__ep1,440.0,459.0,440.0,459.0,449.5,0.0,1.0
235
+ 4b02bb38-384a-438a-b5f9-6131d85c34b0__ep1:qa:32,test,4b02bb38-384a-438a-b5f9-6131d85c34b0__ep1,640.0,659.0,,,,,0.0
236
+ 4b02bb38-384a-438a-b5f9-6131d85c34b0__ep1:qa:33,test,4b02bb38-384a-438a-b5f9-6131d85c34b0__ep1,660.0,679.0,660.0,679.0,669.5,0.0,1.0
237
+ 4b02bb38-384a-438a-b5f9-6131d85c34b0__ep1:qa:34,test,4b02bb38-384a-438a-b5f9-6131d85c34b0__ep1,680.0,699.0,,,,,0.0
238
+ 4b02bb38-384a-438a-b5f9-6131d85c34b0__ep1:qa:50,test,4b02bb38-384a-438a-b5f9-6131d85c34b0__ep1,1000.0,1019.0,0.0,1.6,0.8,1008.7,0.0
239
+ 4b02bb38-384a-438a-b5f9-6131d85c34b0__ep1:qa:51,test,4b02bb38-384a-438a-b5f9-6131d85c34b0__ep1,1020.0,1039.0,1020.0,1039.0,1029.5,0.0,1.0
240
+ 4b02bb38-384a-438a-b5f9-6131d85c34b0__ep1:qa:70,test,4b02bb38-384a-438a-b5f9-6131d85c34b0__ep1,1400.0,1419.0,0.0,1.0,0.5,1409.0,0.0
241
+ 4b02bb38-384a-438a-b5f9-6131d85c34b0__ep1:qa:71,test,4b02bb38-384a-438a-b5f9-6131d85c34b0__ep1,1420.0,1439.0,0.0,1.0,0.5,1429.0,0.0
242
+ 4b02bb38-384a-438a-b5f9-6131d85c34b0__ep1:qa:72,test,4b02bb38-384a-438a-b5f9-6131d85c34b0__ep1,1440.0,1459.0,0.0,15.0,7.5,1442.0,0.0
243
+ 4b02bb38-384a-438a-b5f9-6131d85c34b0__ep1:qa:100,test,4b02bb38-384a-438a-b5f9-6131d85c34b0__ep1,2000.0,2019.0,0.0,19.0,9.5,2000.0,0.0
244
+ 4b02bb38-384a-438a-b5f9-6131d85c34b0__ep1:qa:101,test,4b02bb38-384a-438a-b5f9-6131d85c34b0__ep1,2020.0,2039.0,0.0,1.0,0.5,2029.0,0.0
245
+ 4b02bb38-384a-438a-b5f9-6131d85c34b0__ep1:qa:102,test,4b02bb38-384a-438a-b5f9-6131d85c34b0__ep1,2040.0,2059.0,0.0,1.0,0.5,2049.0,0.0
246
+ 4b02bb38-384a-438a-b5f9-6131d85c34b0__ep1:qa:132,test,4b02bb38-384a-438a-b5f9-6131d85c34b0__ep1,2640.0,2659.0,0.0,19.0,9.5,2640.0,0.0
247
+ 4b02bb38-384a-438a-b5f9-6131d85c34b0__ep1:qa:133,test,4b02bb38-384a-438a-b5f9-6131d85c34b0__ep1,2660.0,2679.0,2660.0,2679.0,2669.5,0.0,1.0
248
+ 4b02bb38-384a-438a-b5f9-6131d85c34b0__ep1:qa:134,test,4b02bb38-384a-438a-b5f9-6131d85c34b0__ep1,2680.0,2699.0,,,,,0.0
249
+ 4b02bb38-384a-438a-b5f9-6131d85c34b0__ep1:qa:184,test,4b02bb38-384a-438a-b5f9-6131d85c34b0__ep1,3680.0,3699.0,3680.0,3699.0,3689.5,0.0,1.0
250
+ 4b02bb38-384a-438a-b5f9-6131d85c34b0__ep1:qa:185,test,4b02bb38-384a-438a-b5f9-6131d85c34b0__ep1,3700.0,3719.0,0.0,19.0,9.5,3700.0,0.0
251
+ 4b02bb38-384a-438a-b5f9-6131d85c34b0__ep1:qa:186,test,4b02bb38-384a-438a-b5f9-6131d85c34b0__ep1,3720.0,3739.0,3720.0,3739.0,3729.5,0.0,1.0
252
+ 4b02bb38-384a-438a-b5f9-6131d85c34b0__ep1:qa:200,test,4b02bb38-384a-438a-b5f9-6131d85c34b0__ep1,4000.0,4019.0,0.0,1.0,0.5,4009.0,0.0
253
+ 4b02bb38-384a-438a-b5f9-6131d85c34b0__ep1:qa:201,test,4b02bb38-384a-438a-b5f9-6131d85c34b0__ep1,4020.0,4039.0,0.0,1.0,0.5,4029.0,0.0
254
+ 4b02bb38-384a-438a-b5f9-6131d85c34b0__ep1:qa:202,test,4b02bb38-384a-438a-b5f9-6131d85c34b0__ep1,4040.0,4059.0,0.0,1.0,0.5,4049.0,0.0
255
+ 4b02bb38-384a-438a-b5f9-6131d85c34b0__ep1:qa:220,test,4b02bb38-384a-438a-b5f9-6131d85c34b0__ep1,4400.0,4419.0,,,,,0.0
256
+ 4b02bb38-384a-438a-b5f9-6131d85c34b0__ep1:qa:221,test,4b02bb38-384a-438a-b5f9-6131d85c34b0__ep1,4420.0,4439.0,,,,,0.0
257
+ 4b02bb38-384a-438a-b5f9-6131d85c34b0__ep1:qa:222,test,4b02bb38-384a-438a-b5f9-6131d85c34b0__ep1,4440.0,4459.0,,,,,0.0
258
+ 5399ef86-4df9-49bc-809f-8f4f92f9e659__ep6:qa:0,test,5399ef86-4df9-49bc-809f-8f4f92f9e659__ep6,0.0,19.0,,,,,0.0
259
+ 5399ef86-4df9-49bc-809f-8f4f92f9e659__ep6:qa:1,test,5399ef86-4df9-49bc-809f-8f4f92f9e659__ep6,20.0,39.0,,,,,0.0
260
+ 5399ef86-4df9-49bc-809f-8f4f92f9e659__ep6:qa:2,test,5399ef86-4df9-49bc-809f-8f4f92f9e659__ep6,40.0,59.0,,,,,0.0
261
+ 5399ef86-4df9-49bc-809f-8f4f92f9e659__ep6:qa:8,test,5399ef86-4df9-49bc-809f-8f4f92f9e659__ep6,160.0,179.0,,,,,0.0
262
+ 5399ef86-4df9-49bc-809f-8f4f92f9e659__ep6:qa:9,test,5399ef86-4df9-49bc-809f-8f4f92f9e659__ep6,180.0,199.0,,,,,0.0
263
+ 5399ef86-4df9-49bc-809f-8f4f92f9e659__ep6:qa:10,test,5399ef86-4df9-49bc-809f-8f4f92f9e659__ep6,200.0,219.0,,,,,0.0
264
+ 5399ef86-4df9-49bc-809f-8f4f92f9e659__ep6:qa:20,test,5399ef86-4df9-49bc-809f-8f4f92f9e659__ep6,400.0,419.0,,,,,0.0
265
+ 5399ef86-4df9-49bc-809f-8f4f92f9e659__ep6:qa:21,test,5399ef86-4df9-49bc-809f-8f4f92f9e659__ep6,420.0,439.0,,,,,0.0
266
+ 5399ef86-4df9-49bc-809f-8f4f92f9e659__ep6:qa:22,test,5399ef86-4df9-49bc-809f-8f4f92f9e659__ep6,440.0,459.0,,,,,0.0
267
+ 5399ef86-4df9-49bc-809f-8f4f92f9e659__ep6:qa:50,test,5399ef86-4df9-49bc-809f-8f4f92f9e659__ep6,1000.0,1019.0,,,,,0.0
268
+ 5399ef86-4df9-49bc-809f-8f4f92f9e659__ep6:qa:51,test,5399ef86-4df9-49bc-809f-8f4f92f9e659__ep6,1020.0,1039.0,1020.0,1039.0,1029.5,0.0,1.0
269
+ 5399ef86-4df9-49bc-809f-8f4f92f9e659__ep6:qa:52,test,5399ef86-4df9-49bc-809f-8f4f92f9e659__ep6,1040.0,1059.0,1040.0,1059.0,1049.5,0.0,1.0
270
+ 5399ef86-4df9-49bc-809f-8f4f92f9e659__ep6:qa:90,test,5399ef86-4df9-49bc-809f-8f4f92f9e659__ep6,1800.0,1819.0,,,,,0.0
271
+ 5399ef86-4df9-49bc-809f-8f4f92f9e659__ep6:qa:91,test,5399ef86-4df9-49bc-809f-8f4f92f9e659__ep6,1820.0,1839.0,,,,,0.0
272
+ 5399ef86-4df9-49bc-809f-8f4f92f9e659__ep6:qa:92,test,5399ef86-4df9-49bc-809f-8f4f92f9e659__ep6,1840.0,1859.0,0.0,0.0,0.0,1849.5,0.0
273
+ 5399ef86-4df9-49bc-809f-8f4f92f9e659__ep6:qa:100,test,5399ef86-4df9-49bc-809f-8f4f92f9e659__ep6,2000.0,2019.0,,,,,0.0
274
+ 5399ef86-4df9-49bc-809f-8f4f92f9e659__ep6:qa:101,test,5399ef86-4df9-49bc-809f-8f4f92f9e659__ep6,2020.0,2039.0,,,,,0.0
275
+ 5399ef86-4df9-49bc-809f-8f4f92f9e659__ep6:qa:102,test,5399ef86-4df9-49bc-809f-8f4f92f9e659__ep6,2040.0,2059.0,,,,,0.0
276
+ 5399ef86-4df9-49bc-809f-8f4f92f9e659__ep6:qa:120,test,5399ef86-4df9-49bc-809f-8f4f92f9e659__ep6,2400.0,2419.0,,,,,0.0
277
+ 5399ef86-4df9-49bc-809f-8f4f92f9e659__ep6:qa:121,test,5399ef86-4df9-49bc-809f-8f4f92f9e659__ep6,2420.0,2439.0,2420.0,2439.0,2429.5,0.0,1.0
278
+ 5399ef86-4df9-49bc-809f-8f4f92f9e659__ep6:qa:140,test,5399ef86-4df9-49bc-809f-8f4f92f9e659__ep6,2800.0,2819.0,,,,,0.0
279
+ 5399ef86-4df9-49bc-809f-8f4f92f9e659__ep6:qa:141,test,5399ef86-4df9-49bc-809f-8f4f92f9e659__ep6,2820.0,2839.0,,,,,0.0
280
+ 5399ef86-4df9-49bc-809f-8f4f92f9e659__ep6:qa:144,test,5399ef86-4df9-49bc-809f-8f4f92f9e659__ep6,2880.0,2899.0,,,,,0.0
281
+ 5399ef86-4df9-49bc-809f-8f4f92f9e659__ep6:qa:145,test,5399ef86-4df9-49bc-809f-8f4f92f9e659__ep6,2900.0,2919.0,,,,,0.0
282
+ 5399ef86-4df9-49bc-809f-8f4f92f9e659__ep6:qa:146,test,5399ef86-4df9-49bc-809f-8f4f92f9e659__ep6,2920.0,2939.0,,,,,0.0
283
+ 5399ef86-4df9-49bc-809f-8f4f92f9e659__ep6:qa:150,test,5399ef86-4df9-49bc-809f-8f4f92f9e659__ep6,3000.0,3019.0,3000.0,3019.0,3009.5,0.0,1.0
284
+ 5399ef86-4df9-49bc-809f-8f4f92f9e659__ep6:qa:151,test,5399ef86-4df9-49bc-809f-8f4f92f9e659__ep6,3020.0,3039.0,3020.0,3039.0,3029.5,0.0,1.0
285
+ 5399ef86-4df9-49bc-809f-8f4f92f9e659__ep6:qa:160,test,5399ef86-4df9-49bc-809f-8f4f92f9e659__ep6,3200.0,3219.0,3200.0,3219.0,3209.5,0.0,1.0
286
+ 5399ef86-4df9-49bc-809f-8f4f92f9e659__ep6:qa:161,test,5399ef86-4df9-49bc-809f-8f4f92f9e659__ep6,3220.0,3239.0,3220.0,3239.0,3229.5,0.0,1.0
287
+ 5399ef86-4df9-49bc-809f-8f4f92f9e659__ep6:qa:162,test,5399ef86-4df9-49bc-809f-8f4f92f9e659__ep6,3240.0,3259.0,,,,,0.0
288
+ 5399ef86-4df9-49bc-809f-8f4f92f9e659__ep6:qa:190,test,5399ef86-4df9-49bc-809f-8f4f92f9e659__ep6,3800.0,3819.0,,,,,0.0
289
+ 5399ef86-4df9-49bc-809f-8f4f92f9e659__ep6:qa:191,test,5399ef86-4df9-49bc-809f-8f4f92f9e659__ep6,3820.0,3839.0,,,,,0.0
290
+ b750fab3-7fbb-43a0-b451-c64c4d4a64da__ep1:qa:0,test,b750fab3-7fbb-43a0-b451-c64c4d4a64da__ep1,0.0,19.0,0.0,0.0,0.0,9.5,0.05
291
+ b750fab3-7fbb-43a0-b451-c64c4d4a64da__ep1:qa:20,test,b750fab3-7fbb-43a0-b451-c64c4d4a64da__ep1,400.0,419.0,380.0,419.0,399.5,10.0,0.5
292
+ b750fab3-7fbb-43a0-b451-c64c4d4a64da__ep1:qa:21,test,b750fab3-7fbb-43a0-b451-c64c4d4a64da__ep1,420.0,439.0,420.0,439.0,429.5,0.0,1.0
293
+ b750fab3-7fbb-43a0-b451-c64c4d4a64da__ep1:qa:28,test,b750fab3-7fbb-43a0-b451-c64c4d4a64da__ep1,560.0,579.0,560.0,579.0,569.5,0.0,1.0
294
+ b750fab3-7fbb-43a0-b451-c64c4d4a64da__ep1:qa:29,test,b750fab3-7fbb-43a0-b451-c64c4d4a64da__ep1,580.0,599.0,,,,,0.0
295
+ b750fab3-7fbb-43a0-b451-c64c4d4a64da__ep1:qa:34,test,b750fab3-7fbb-43a0-b451-c64c4d4a64da__ep1,680.0,699.0,680.0,699.0,689.5,0.0,1.0
296
+ b750fab3-7fbb-43a0-b451-c64c4d4a64da__ep1:qa:35,test,b750fab3-7fbb-43a0-b451-c64c4d4a64da__ep1,700.0,719.0,,,,,0.0
297
+ b750fab3-7fbb-43a0-b451-c64c4d4a64da__ep1:qa:40,test,b750fab3-7fbb-43a0-b451-c64c4d4a64da__ep1,800.0,819.0,794.0,819.0,806.5,3.0,0.7692307692307693
298
+ b750fab3-7fbb-43a0-b451-c64c4d4a64da__ep1:qa:41,test,b750fab3-7fbb-43a0-b451-c64c4d4a64da__ep1,820.0,839.0,819.0,839.0,829.0,0.5,0.9523809523809523
299
+ b750fab3-7fbb-43a0-b451-c64c4d4a64da__ep1:qa:70,test,b750fab3-7fbb-43a0-b451-c64c4d4a64da__ep1,1400.0,1419.0,1400.0,1419.0,1409.5,0.0,1.0
300
+ b750fab3-7fbb-43a0-b451-c64c4d4a64da__ep1:qa:71,test,b750fab3-7fbb-43a0-b451-c64c4d4a64da__ep1,1420.0,1439.0,1420.0,1439.0,1429.5,0.0,1.0
301
+ b750fab3-7fbb-43a0-b451-c64c4d4a64da__ep1:qa:74,test,b750fab3-7fbb-43a0-b451-c64c4d4a64da__ep1,1480.0,1499.0,1480.0,1499.0,1489.5,0.0,1.0
302
+ b750fab3-7fbb-43a0-b451-c64c4d4a64da__ep1:qa:75,test,b750fab3-7fbb-43a0-b451-c64c4d4a64da__ep1,1500.0,1519.0,1494.0,1519.0,1506.5,3.0,0.7692307692307693
303
+ b750fab3-7fbb-43a0-b451-c64c4d4a64da__ep1:qa:82,test,b750fab3-7fbb-43a0-b451-c64c4d4a64da__ep1,1640.0,1659.0,,,,,0.0
304
+ b750fab3-7fbb-43a0-b451-c64c4d4a64da__ep1:qa:83,test,b750fab3-7fbb-43a0-b451-c64c4d4a64da__ep1,1660.0,1679.0,1660.0,1679.0,1669.5,0.0,1.0
305
+ b750fab3-7fbb-43a0-b451-c64c4d4a64da__ep1:qa:90,test,b750fab3-7fbb-43a0-b451-c64c4d4a64da__ep1,1800.0,1819.0,,,,,0.0
306
+ b750fab3-7fbb-43a0-b451-c64c4d4a64da__ep1:qa:91,test,b750fab3-7fbb-43a0-b451-c64c4d4a64da__ep1,1820.0,1839.0,,,,,0.0
307
+ b750fab3-7fbb-43a0-b451-c64c4d4a64da__ep1:qa:120,test,b750fab3-7fbb-43a0-b451-c64c4d4a64da__ep1,2400.0,2419.0,,,,,0.0
308
+ b750fab3-7fbb-43a0-b451-c64c4d4a64da__ep1:qa:121,test,b750fab3-7fbb-43a0-b451-c64c4d4a64da__ep1,2420.0,2439.0,,,,,0.0
309
+ b750fab3-7fbb-43a0-b451-c64c4d4a64da__ep1:qa:150,test,b750fab3-7fbb-43a0-b451-c64c4d4a64da__ep1,3000.0,3019.0,0.0,19.0,9.5,3000.0,0.0
310
+ b750fab3-7fbb-43a0-b451-c64c4d4a64da__ep1:qa:151,test,b750fab3-7fbb-43a0-b451-c64c4d4a64da__ep1,3020.0,3039.0,,,,,0.0
311
+ b750fab3-7fbb-43a0-b451-c64c4d4a64da__ep1:qa:190,test,b750fab3-7fbb-43a0-b451-c64c4d4a64da__ep1,3800.0,3819.0,0.0,19.0,9.5,3800.0,0.0
312
+ b750fab3-7fbb-43a0-b451-c64c4d4a64da__ep1:qa:191,test,b750fab3-7fbb-43a0-b451-c64c4d4a64da__ep1,3820.0,3839.0,,,,,0.0
313
+ b750fab3-7fbb-43a0-b451-c64c4d4a64da__ep1:qa:220,test,b750fab3-7fbb-43a0-b451-c64c4d4a64da__ep1,4400.0,4419.0,,,,,0.0
314
+ b750fab3-7fbb-43a0-b451-c64c4d4a64da__ep1:qa:221,test,b750fab3-7fbb-43a0-b451-c64c4d4a64da__ep1,4420.0,4439.0,4386.0,4439.0,4412.5,17.0,0.37037037037037035
315
+ b750fab3-7fbb-43a0-b451-c64c4d4a64da__ep1:qa:240,test,b750fab3-7fbb-43a0-b451-c64c4d4a64da__ep1,4800.0,4819.0,0.0,19.0,9.5,4800.0,0.0
316
+ b750fab3-7fbb-43a0-b451-c64c4d4a64da__ep1:qa:246,test,b750fab3-7fbb-43a0-b451-c64c4d4a64da__ep1,4920.0,4939.0,0.0,1.0,0.5,4929.0,0.0
317
+ b750fab3-7fbb-43a0-b451-c64c4d4a64da__ep1:qa:247,test,b750fab3-7fbb-43a0-b451-c64c4d4a64da__ep1,4940.0,4959.0,4940.0,4959.0,4949.5,0.0,1.0
318
+ b750fab3-7fbb-43a0-b451-c64c4d4a64da__ep1:qa:250,test,b750fab3-7fbb-43a0-b451-c64c4d4a64da__ep1,5000.0,5019.0,,,,,0.0
319
+ b750fab3-7fbb-43a0-b451-c64c4d4a64da__ep1:qa:251,test,b750fab3-7fbb-43a0-b451-c64c4d4a64da__ep1,5020.0,5039.0,0.0,1.0,0.5,5029.0,0.0
320
+ b750fab3-7fbb-43a0-b451-c64c4d4a64da__ep1:qa:296,test,b750fab3-7fbb-43a0-b451-c64c4d4a64da__ep1,5920.0,5939.0,0.0,1.0,0.5,5929.0,0.0
321
+ b750fab3-7fbb-43a0-b451-c64c4d4a64da__ep1:qa:297,test,b750fab3-7fbb-43a0-b451-c64c4d4a64da__ep1,5940.0,5959.0,0.0,19.0,9.5,5940.0,0.0
322
+ 877779cd-25f3-4293-a3c4-39067dd9558c__ep4:qa:0,test,877779cd-25f3-4293-a3c4-39067dd9558c__ep4,0.0,19.0,,,,,0.0
323
+ 877779cd-25f3-4293-a3c4-39067dd9558c__ep4:qa:1,test,877779cd-25f3-4293-a3c4-39067dd9558c__ep4,20.0,39.0,,,,,0.0
324
+ 877779cd-25f3-4293-a3c4-39067dd9558c__ep4:qa:2,test,877779cd-25f3-4293-a3c4-39067dd9558c__ep4,40.0,59.0,,,,,0.0
325
+ 877779cd-25f3-4293-a3c4-39067dd9558c__ep4:qa:20,test,877779cd-25f3-4293-a3c4-39067dd9558c__ep4,400.0,419.0,380.0,419.0,399.5,10.0,0.5
326
+ 877779cd-25f3-4293-a3c4-39067dd9558c__ep4:qa:21,test,877779cd-25f3-4293-a3c4-39067dd9558c__ep4,420.0,439.0,,,,,0.0
327
+ 877779cd-25f3-4293-a3c4-39067dd9558c__ep4:qa:22,test,877779cd-25f3-4293-a3c4-39067dd9558c__ep4,440.0,459.0,440.0,459.0,449.5,0.0,1.0
328
+ 877779cd-25f3-4293-a3c4-39067dd9558c__ep4:qa:23,test,877779cd-25f3-4293-a3c4-39067dd9558c__ep4,460.0,479.0,,,,,0.0
329
+ 877779cd-25f3-4293-a3c4-39067dd9558c__ep4:qa:50,test,877779cd-25f3-4293-a3c4-39067dd9558c__ep4,1000.0,1019.0,,,,,0.0
330
+ 877779cd-25f3-4293-a3c4-39067dd9558c__ep4:qa:51,test,877779cd-25f3-4293-a3c4-39067dd9558c__ep4,1020.0,1039.0,,,,,0.0
331
+ 877779cd-25f3-4293-a3c4-39067dd9558c__ep4:qa:52,test,877779cd-25f3-4293-a3c4-39067dd9558c__ep4,1040.0,1059.0,,,,,0.0
332
+ 877779cd-25f3-4293-a3c4-39067dd9558c__ep4:qa:53,test,877779cd-25f3-4293-a3c4-39067dd9558c__ep4,1060.0,1079.0,,,,,0.0
333
+ 877779cd-25f3-4293-a3c4-39067dd9558c__ep4:qa:70,test,877779cd-25f3-4293-a3c4-39067dd9558c__ep4,1400.0,1419.0,,,,,0.0
334
+ 877779cd-25f3-4293-a3c4-39067dd9558c__ep4:qa:71,test,877779cd-25f3-4293-a3c4-39067dd9558c__ep4,1420.0,1439.0,,,,,0.0
335
+ 877779cd-25f3-4293-a3c4-39067dd9558c__ep4:qa:72,test,877779cd-25f3-4293-a3c4-39067dd9558c__ep4,1440.0,1459.0,,,,,0.0
336
+ 877779cd-25f3-4293-a3c4-39067dd9558c__ep4:qa:100,test,877779cd-25f3-4293-a3c4-39067dd9558c__ep4,2000.0,2019.0,1991.0,2019.0,2005.0,4.5,0.6896551724137931
337
+ 877779cd-25f3-4293-a3c4-39067dd9558c__ep4:qa:101,test,877779cd-25f3-4293-a3c4-39067dd9558c__ep4,2020.0,2039.0,2019.0,2039.0,2029.0,0.5,0.9523809523809523
338
+ 877779cd-25f3-4293-a3c4-39067dd9558c__ep4:qa:102,test,877779cd-25f3-4293-a3c4-39067dd9558c__ep4,2040.0,2059.0,2040.0,2059.0,2049.5,0.0,1.0
339
+ 877779cd-25f3-4293-a3c4-39067dd9558c__ep4:qa:108,test,877779cd-25f3-4293-a3c4-39067dd9558c__ep4,2160.0,2179.0,,,,,0.0
340
+ 877779cd-25f3-4293-a3c4-39067dd9558c__ep4:qa:109,test,877779cd-25f3-4293-a3c4-39067dd9558c__ep4,2180.0,2199.0,,,,,0.0
341
+ 877779cd-25f3-4293-a3c4-39067dd9558c__ep4:qa:110,test,877779cd-25f3-4293-a3c4-39067dd9558c__ep4,2200.0,2219.0,2199.0,2219.0,2209.0,0.5,0.9523809523809523
342
+ 877779cd-25f3-4293-a3c4-39067dd9558c__ep4:qa:120,test,877779cd-25f3-4293-a3c4-39067dd9558c__ep4,2400.0,2419.0,,,,,0.0
343
+ 877779cd-25f3-4293-a3c4-39067dd9558c__ep4:qa:121,test,877779cd-25f3-4293-a3c4-39067dd9558c__ep4,2420.0,2439.0,,,,,0.0
344
+ 877779cd-25f3-4293-a3c4-39067dd9558c__ep4:qa:122,test,877779cd-25f3-4293-a3c4-39067dd9558c__ep4,2440.0,2459.0,,,,,0.0
345
+ 877779cd-25f3-4293-a3c4-39067dd9558c__ep4:qa:150,test,877779cd-25f3-4293-a3c4-39067dd9558c__ep4,3000.0,3019.0,,,,,0.0
346
+ 877779cd-25f3-4293-a3c4-39067dd9558c__ep4:qa:151,test,877779cd-25f3-4293-a3c4-39067dd9558c__ep4,3020.0,3039.0,,,,,0.0
347
+ 877779cd-25f3-4293-a3c4-39067dd9558c__ep4:qa:152,test,877779cd-25f3-4293-a3c4-39067dd9558c__ep4,3040.0,3059.0,,,,,0.0
348
+ 877779cd-25f3-4293-a3c4-39067dd9558c__ep4:qa:170,test,877779cd-25f3-4293-a3c4-39067dd9558c__ep4,3400.0,3419.0,0.0,19.0,9.5,3400.0,0.0
349
+ 877779cd-25f3-4293-a3c4-39067dd9558c__ep4:qa:171,test,877779cd-25f3-4293-a3c4-39067dd9558c__ep4,3420.0,3439.0,0.0,1.0,0.5,3429.0,0.0
350
+ 877779cd-25f3-4293-a3c4-39067dd9558c__ep4:qa:172,test,877779cd-25f3-4293-a3c4-39067dd9558c__ep4,3440.0,3459.0,0.0,1.0,0.5,3449.0,0.0
351
+ 877779cd-25f3-4293-a3c4-39067dd9558c__ep4:qa:200,test,877779cd-25f3-4293-a3c4-39067dd9558c__ep4,4000.0,4019.0,,,,,0.0
352
+ 877779cd-25f3-4293-a3c4-39067dd9558c__ep4:qa:201,test,877779cd-25f3-4293-a3c4-39067dd9558c__ep4,4020.0,4039.0,,,,,0.0
353
+ 877779cd-25f3-4293-a3c4-39067dd9558c__ep4:qa:202,test,877779cd-25f3-4293-a3c4-39067dd9558c__ep4,4040.0,4059.0,4040.0,4059.0,4049.5,0.0,1.0
354
+ 1796b943-caad-43c6-b9bd-80b8d601f37d__ep1:qa:0,test,1796b943-caad-43c6-b9bd-80b8d601f37d__ep1,0.0,19.0,0.0,1.0,0.5,9.0,0.1
355
+ 1796b943-caad-43c6-b9bd-80b8d601f37d__ep1:qa:1,test,1796b943-caad-43c6-b9bd-80b8d601f37d__ep1,20.0,39.0,,,,,0.0
356
+ 1796b943-caad-43c6-b9bd-80b8d601f37d__ep1:qa:2,test,1796b943-caad-43c6-b9bd-80b8d601f37d__ep1,40.0,59.0,,,,,0.0
357
+ 1796b943-caad-43c6-b9bd-80b8d601f37d__ep1:qa:10,test,1796b943-caad-43c6-b9bd-80b8d601f37d__ep1,200.0,219.0,180.0,219.0,199.5,10.0,0.5
358
+ 1796b943-caad-43c6-b9bd-80b8d601f37d__ep1:qa:11,test,1796b943-caad-43c6-b9bd-80b8d601f37d__ep1,220.0,239.0,220.0,239.0,229.5,0.0,1.0
359
+ 1796b943-caad-43c6-b9bd-80b8d601f37d__ep1:qa:12,test,1796b943-caad-43c6-b9bd-80b8d601f37d__ep1,240.0,259.0,0.0,10.0,5.0,244.5,0.0
360
+ 1796b943-caad-43c6-b9bd-80b8d601f37d__ep1:qa:13,test,1796b943-caad-43c6-b9bd-80b8d601f37d__ep1,260.0,279.0,0.0,1.0,0.5,269.0,0.0
361
+ 1796b943-caad-43c6-b9bd-80b8d601f37d__ep1:qa:20,test,1796b943-caad-43c6-b9bd-80b8d601f37d__ep1,400.0,419.0,400.0,419.0,409.5,0.0,1.0
362
+ 1796b943-caad-43c6-b9bd-80b8d601f37d__ep1:qa:21,test,1796b943-caad-43c6-b9bd-80b8d601f37d__ep1,420.0,439.0,420.0,439.0,429.5,0.0,1.0
363
+ 1796b943-caad-43c6-b9bd-80b8d601f37d__ep1:qa:22,test,1796b943-caad-43c6-b9bd-80b8d601f37d__ep1,440.0,459.0,,,,,0.0
364
+ 1796b943-caad-43c6-b9bd-80b8d601f37d__ep1:qa:28,test,1796b943-caad-43c6-b9bd-80b8d601f37d__ep1,560.0,579.0,,,,,0.0
365
+ 1796b943-caad-43c6-b9bd-80b8d601f37d__ep1:qa:29,test,1796b943-caad-43c6-b9bd-80b8d601f37d__ep1,580.0,599.0,580.0,599.0,589.5,0.0,1.0
366
+ 1796b943-caad-43c6-b9bd-80b8d601f37d__ep1:qa:30,test,1796b943-caad-43c6-b9bd-80b8d601f37d__ep1,600.0,619.0,608.0,619.0,613.5,4.0,0.6
367
+ 1796b943-caad-43c6-b9bd-80b8d601f37d__ep1:qa:40,test,1796b943-caad-43c6-b9bd-80b8d601f37d__ep1,800.0,819.0,800.0,819.0,809.5,0.0,1.0
368
+ 1796b943-caad-43c6-b9bd-80b8d601f37d__ep1:qa:41,test,1796b943-caad-43c6-b9bd-80b8d601f37d__ep1,820.0,839.0,,,,,0.0
369
+ 1796b943-caad-43c6-b9bd-80b8d601f37d__ep1:qa:42,test,1796b943-caad-43c6-b9bd-80b8d601f37d__ep1,840.0,859.0,,,,,0.0
370
+ 1796b943-caad-43c6-b9bd-80b8d601f37d__ep1:qa:50,test,1796b943-caad-43c6-b9bd-80b8d601f37d__ep1,1000.0,1019.0,,,,,0.0
371
+ 1796b943-caad-43c6-b9bd-80b8d601f37d__ep1:qa:51,test,1796b943-caad-43c6-b9bd-80b8d601f37d__ep1,1020.0,1039.0,,,,,0.0
372
+ 1796b943-caad-43c6-b9bd-80b8d601f37d__ep1:qa:52,test,1796b943-caad-43c6-b9bd-80b8d601f37d__ep1,1040.0,1059.0,,,,,0.0
373
+ 1796b943-caad-43c6-b9bd-80b8d601f37d__ep1:qa:70,test,1796b943-caad-43c6-b9bd-80b8d601f37d__ep1,1400.0,1419.0,,,,,0.0
374
+ 1796b943-caad-43c6-b9bd-80b8d601f37d__ep1:qa:71,test,1796b943-caad-43c6-b9bd-80b8d601f37d__ep1,1420.0,1439.0,,,,,0.0
375
+ 1796b943-caad-43c6-b9bd-80b8d601f37d__ep1:qa:72,test,1796b943-caad-43c6-b9bd-80b8d601f37d__ep1,1440.0,1459.0,1440.0,1459.0,1449.5,0.0,1.0
376
+ 1796b943-caad-43c6-b9bd-80b8d601f37d__ep1:qa:90,test,1796b943-caad-43c6-b9bd-80b8d601f37d__ep1,1800.0,1819.0,0.0,19.0,9.5,1800.0,0.0
377
+ 1796b943-caad-43c6-b9bd-80b8d601f37d__ep1:qa:91,test,1796b943-caad-43c6-b9bd-80b8d601f37d__ep1,1820.0,1839.0,0.0,15.0,7.5,1822.0,0.0
378
+ 1796b943-caad-43c6-b9bd-80b8d601f37d__ep1:qa:92,test,1796b943-caad-43c6-b9bd-80b8d601f37d__ep1,1840.0,1859.0,,,,,0.0
379
+ 1796b943-caad-43c6-b9bd-80b8d601f37d__ep1:qa:100,test,1796b943-caad-43c6-b9bd-80b8d601f37d__ep1,2000.0,2019.0,,,,,0.0
380
+ 1796b943-caad-43c6-b9bd-80b8d601f37d__ep1:qa:101,test,1796b943-caad-43c6-b9bd-80b8d601f37d__ep1,2020.0,2039.0,0.0,10.0,5.0,2024.5,0.0
381
+ 1796b943-caad-43c6-b9bd-80b8d601f37d__ep1:qa:102,test,1796b943-caad-43c6-b9bd-80b8d601f37d__ep1,2040.0,2059.0,,,,,0.0
382
+ 1796b943-caad-43c6-b9bd-80b8d601f37d__ep1:qa:103,test,1796b943-caad-43c6-b9bd-80b8d601f37d__ep1,2060.0,2079.0,,,,,0.0
383
+ 1796b943-caad-43c6-b9bd-80b8d601f37d__ep1:qa:140,test,1796b943-caad-43c6-b9bd-80b8d601f37d__ep1,2800.0,2819.0,2666.0,2819.0,2742.5,67.0,0.12987012987012986
384
+ 1796b943-caad-43c6-b9bd-80b8d601f37d__ep1:qa:141,test,1796b943-caad-43c6-b9bd-80b8d601f37d__ep1,2820.0,2839.0,,,,,0.0
385
+ 1796b943-caad-43c6-b9bd-80b8d601f37d__ep1:qa:142,test,1796b943-caad-43c6-b9bd-80b8d601f37d__ep1,2840.0,2859.0,,,,,0.0
386
+ ba18b7c1-21ff-45da-8452-41acce7fc8de__ep2:qa:0,test,ba18b7c1-21ff-45da-8452-41acce7fc8de__ep2,0.0,19.0,0.0,1.0,0.5,9.0,0.1
387
+ ba18b7c1-21ff-45da-8452-41acce7fc8de__ep2:qa:1,test,ba18b7c1-21ff-45da-8452-41acce7fc8de__ep2,20.0,39.0,0.0,19.0,9.5,20.0,0.0
388
+ ba18b7c1-21ff-45da-8452-41acce7fc8de__ep2:qa:2,test,ba18b7c1-21ff-45da-8452-41acce7fc8de__ep2,40.0,59.0,0.0,59.0,29.5,20.0,0.3333333333333333
389
+ ba18b7c1-21ff-45da-8452-41acce7fc8de__ep2:qa:3,test,ba18b7c1-21ff-45da-8452-41acce7fc8de__ep2,60.0,79.0,0.0,1.0,0.5,69.0,0.0
390
+ ba18b7c1-21ff-45da-8452-41acce7fc8de__ep2:qa:4,test,ba18b7c1-21ff-45da-8452-41acce7fc8de__ep2,80.0,99.0,0.0,99.0,49.5,40.0,0.2
391
+ ba18b7c1-21ff-45da-8452-41acce7fc8de__ep2:qa:40,test,ba18b7c1-21ff-45da-8452-41acce7fc8de__ep2,800.0,819.0,,,,,0.0
392
+ ba18b7c1-21ff-45da-8452-41acce7fc8de__ep2:qa:41,test,ba18b7c1-21ff-45da-8452-41acce7fc8de__ep2,820.0,839.0,,,,,0.0
393
+ ba18b7c1-21ff-45da-8452-41acce7fc8de__ep2:qa:42,test,ba18b7c1-21ff-45da-8452-41acce7fc8de__ep2,840.0,859.0,,,,,0.0
394
+ ba18b7c1-21ff-45da-8452-41acce7fc8de__ep2:qa:43,test,ba18b7c1-21ff-45da-8452-41acce7fc8de__ep2,860.0,879.0,,,,,0.0
395
+ ba18b7c1-21ff-45da-8452-41acce7fc8de__ep2:qa:44,test,ba18b7c1-21ff-45da-8452-41acce7fc8de__ep2,880.0,899.0,,,,,0.0
396
+ ba18b7c1-21ff-45da-8452-41acce7fc8de__ep2:qa:60,test,ba18b7c1-21ff-45da-8452-41acce7fc8de__ep2,1200.0,1219.0,1199.0,1219.0,1209.0,0.5,0.9523809523809523
397
+ ba18b7c1-21ff-45da-8452-41acce7fc8de__ep2:qa:61,test,ba18b7c1-21ff-45da-8452-41acce7fc8de__ep2,1220.0,1239.0,1220.0,1239.0,1229.5,0.0,1.0
398
+ ba18b7c1-21ff-45da-8452-41acce7fc8de__ep2:qa:62,test,ba18b7c1-21ff-45da-8452-41acce7fc8de__ep2,1240.0,1259.0,1240.0,1259.0,1249.5,0.0,1.0
399
+ ba18b7c1-21ff-45da-8452-41acce7fc8de__ep2:qa:63,test,ba18b7c1-21ff-45da-8452-41acce7fc8de__ep2,1260.0,1279.0,,,,,0.0
400
+ ba18b7c1-21ff-45da-8452-41acce7fc8de__ep2:qa:90,test,ba18b7c1-21ff-45da-8452-41acce7fc8de__ep2,1800.0,1819.0,,,,,0.0
401
+ ba18b7c1-21ff-45da-8452-41acce7fc8de__ep2:qa:91,test,ba18b7c1-21ff-45da-8452-41acce7fc8de__ep2,1820.0,1839.0,,,,,0.0
402
+ ba18b7c1-21ff-45da-8452-41acce7fc8de__ep2:qa:92,test,ba18b7c1-21ff-45da-8452-41acce7fc8de__ep2,1840.0,1859.0,,,,,0.0
403
+ ba18b7c1-21ff-45da-8452-41acce7fc8de__ep2:qa:93,test,ba18b7c1-21ff-45da-8452-41acce7fc8de__ep2,1860.0,1879.0,,,,,0.0
404
+ ba18b7c1-21ff-45da-8452-41acce7fc8de__ep2:qa:94,test,ba18b7c1-21ff-45da-8452-41acce7fc8de__ep2,1880.0,1899.0,,,,,0.0
405
+ ba18b7c1-21ff-45da-8452-41acce7fc8de__ep2:qa:146,test,ba18b7c1-21ff-45da-8452-41acce7fc8de__ep2,2920.0,2939.0,,,,,0.0
406
+ ba18b7c1-21ff-45da-8452-41acce7fc8de__ep2:qa:147,test,ba18b7c1-21ff-45da-8452-41acce7fc8de__ep2,2940.0,2959.0,,,,,0.0
407
+ ba18b7c1-21ff-45da-8452-41acce7fc8de__ep2:qa:148,test,ba18b7c1-21ff-45da-8452-41acce7fc8de__ep2,2960.0,2979.0,,,,,0.0
408
+ ba18b7c1-21ff-45da-8452-41acce7fc8de__ep2:qa:149,test,ba18b7c1-21ff-45da-8452-41acce7fc8de__ep2,2980.0,2999.0,,,,,0.0
409
+ ba18b7c1-21ff-45da-8452-41acce7fc8de__ep2:qa:170,test,ba18b7c1-21ff-45da-8452-41acce7fc8de__ep2,3400.0,3419.0,3399.0,3419.0,3409.0,0.5,0.9523809523809523
410
+ ba18b7c1-21ff-45da-8452-41acce7fc8de__ep2:qa:171,test,ba18b7c1-21ff-45da-8452-41acce7fc8de__ep2,3420.0,3439.0,0.0,39.0,19.5,3410.0,0.0
411
+ ba18b7c1-21ff-45da-8452-41acce7fc8de__ep2:qa:172,test,ba18b7c1-21ff-45da-8452-41acce7fc8de__ep2,3440.0,3459.0,0.0,1.0,0.5,3449.0,0.0
412
+ ba18b7c1-21ff-45da-8452-41acce7fc8de__ep2:qa:173,test,ba18b7c1-21ff-45da-8452-41acce7fc8de__ep2,3460.0,3479.0,0.0,1.0,0.5,3469.0,0.0
413
+ ba18b7c1-21ff-45da-8452-41acce7fc8de__ep2:qa:174,test,ba18b7c1-21ff-45da-8452-41acce7fc8de__ep2,3480.0,3499.0,3480.0,3499.0,3489.5,0.0,1.0
414
+ ba18b7c1-21ff-45da-8452-41acce7fc8de__ep2:qa:240,test,ba18b7c1-21ff-45da-8452-41acce7fc8de__ep2,4800.0,4819.0,0.0,1.0,0.5,4809.0,0.0
415
+ ba18b7c1-21ff-45da-8452-41acce7fc8de__ep2:qa:241,test,ba18b7c1-21ff-45da-8452-41acce7fc8de__ep2,4820.0,4839.0,0.0,1.0,0.5,4829.0,0.0
416
+ ba18b7c1-21ff-45da-8452-41acce7fc8de__ep2:qa:242,test,ba18b7c1-21ff-45da-8452-41acce7fc8de__ep2,4840.0,4859.0,4840.0,4859.0,4849.5,0.0,1.0
417
+ ba18b7c1-21ff-45da-8452-41acce7fc8de__ep2:qa:243,test,ba18b7c1-21ff-45da-8452-41acce7fc8de__ep2,4860.0,4879.0,0.0,1.0,0.5,4869.0,0.0
418
+ b6579cb5-0a71-4ca6-8808-1e2700be05c7__ep3:qa:0,test,b6579cb5-0a71-4ca6-8808-1e2700be05c7__ep3,0.0,19.0,,,,,0.0
419
+ b6579cb5-0a71-4ca6-8808-1e2700be05c7__ep3:qa:1,test,b6579cb5-0a71-4ca6-8808-1e2700be05c7__ep3,20.0,39.0,0.0,2.0,1.0,28.5,0.0
420
+ b6579cb5-0a71-4ca6-8808-1e2700be05c7__ep3:qa:14,test,b6579cb5-0a71-4ca6-8808-1e2700be05c7__ep3,280.0,299.0,280.0,299.0,289.5,0.0,1.0
421
+ b6579cb5-0a71-4ca6-8808-1e2700be05c7__ep3:qa:15,test,b6579cb5-0a71-4ca6-8808-1e2700be05c7__ep3,300.0,319.0,,,,,0.0
422
+ b6579cb5-0a71-4ca6-8808-1e2700be05c7__ep3:qa:50,test,b6579cb5-0a71-4ca6-8808-1e2700be05c7__ep3,1000.0,1019.0,,,,,0.0
423
+ b6579cb5-0a71-4ca6-8808-1e2700be05c7__ep3:qa:100,test,b6579cb5-0a71-4ca6-8808-1e2700be05c7__ep3,2000.0,2019.0,,,,,0.0
424
+ b6579cb5-0a71-4ca6-8808-1e2700be05c7__ep3:qa:101,test,b6579cb5-0a71-4ca6-8808-1e2700be05c7__ep3,2020.0,2039.0,2014.0,2039.0,2026.5,3.0,0.7692307692307693
425
+ b6579cb5-0a71-4ca6-8808-1e2700be05c7__ep3:qa:120,test,b6579cb5-0a71-4ca6-8808-1e2700be05c7__ep3,2400.0,2419.0,,,,,0.0
426
+ b6579cb5-0a71-4ca6-8808-1e2700be05c7__ep3:qa:121,test,b6579cb5-0a71-4ca6-8808-1e2700be05c7__ep3,2420.0,2439.0,,,,,0.0
427
+ b6579cb5-0a71-4ca6-8808-1e2700be05c7__ep3:qa:128,test,b6579cb5-0a71-4ca6-8808-1e2700be05c7__ep3,2560.0,2579.0,,,,,0.0
428
+ b6579cb5-0a71-4ca6-8808-1e2700be05c7__ep3:qa:129,test,b6579cb5-0a71-4ca6-8808-1e2700be05c7__ep3,2580.0,2599.0,2580.0,2599.0,2589.5,0.0,1.0
429
+ b6579cb5-0a71-4ca6-8808-1e2700be05c7__ep3:qa:150,test,b6579cb5-0a71-4ca6-8808-1e2700be05c7__ep3,3000.0,3019.0,,,,,0.0
430
+ b6579cb5-0a71-4ca6-8808-1e2700be05c7__ep3:qa:164,test,b6579cb5-0a71-4ca6-8808-1e2700be05c7__ep3,3280.0,3299.0,,,,,0.0
431
+ b6579cb5-0a71-4ca6-8808-1e2700be05c7__ep3:qa:180,test,b6579cb5-0a71-4ca6-8808-1e2700be05c7__ep3,3600.0,3619.0,3598.0,3619.0,3608.5,1.0,0.9090909090909091
432
+ b6579cb5-0a71-4ca6-8808-1e2700be05c7__ep3:qa:181,test,b6579cb5-0a71-4ca6-8808-1e2700be05c7__ep3,3620.0,3639.0,3611.0,3639.0,3625.0,4.5,0.6896551724137931
433
+ b6579cb5-0a71-4ca6-8808-1e2700be05c7__ep3:qa:200,test,b6579cb5-0a71-4ca6-8808-1e2700be05c7__ep3,4000.0,4019.0,,,,,0.0
434
+ b6579cb5-0a71-4ca6-8808-1e2700be05c7__ep3:qa:201,test,b6579cb5-0a71-4ca6-8808-1e2700be05c7__ep3,4020.0,4039.0,,,,,0.0
435
+ b6579cb5-0a71-4ca6-8808-1e2700be05c7__ep3:qa:212,test,b6579cb5-0a71-4ca6-8808-1e2700be05c7__ep3,4240.0,4259.0,,,,,0.0
436
+ b6579cb5-0a71-4ca6-8808-1e2700be05c7__ep3:qa:213,test,b6579cb5-0a71-4ca6-8808-1e2700be05c7__ep3,4260.0,4279.0,,,,,0.0
437
+ b6579cb5-0a71-4ca6-8808-1e2700be05c7__ep3:qa:220,test,b6579cb5-0a71-4ca6-8808-1e2700be05c7__ep3,4400.0,4419.0,,,,,0.0
438
+ b6579cb5-0a71-4ca6-8808-1e2700be05c7__ep3:qa:221,test,b6579cb5-0a71-4ca6-8808-1e2700be05c7__ep3,4420.0,4439.0,4385.0,4439.0,4412.0,17.5,0.36363636363636365
439
+ b6579cb5-0a71-4ca6-8808-1e2700be05c7__ep3:qa:232,test,b6579cb5-0a71-4ca6-8808-1e2700be05c7__ep3,4640.0,4659.0,,,,,0.0
440
+ b6579cb5-0a71-4ca6-8808-1e2700be05c7__ep3:qa:233,test,b6579cb5-0a71-4ca6-8808-1e2700be05c7__ep3,4660.0,4679.0,4654.0,4679.0,4666.5,3.0,0.7692307692307693
441
+ b6579cb5-0a71-4ca6-8808-1e2700be05c7__ep3:qa:240,test,b6579cb5-0a71-4ca6-8808-1e2700be05c7__ep3,4800.0,4819.0,,,,,0.0
442
+ b6579cb5-0a71-4ca6-8808-1e2700be05c7__ep3:qa:244,test,b6579cb5-0a71-4ca6-8808-1e2700be05c7__ep3,4880.0,4899.0,,,,,0.0
443
+ b6579cb5-0a71-4ca6-8808-1e2700be05c7__ep3:qa:245,test,b6579cb5-0a71-4ca6-8808-1e2700be05c7__ep3,4900.0,4919.0,,,,,0.0
444
+ b6579cb5-0a71-4ca6-8808-1e2700be05c7__ep3:qa:250,test,b6579cb5-0a71-4ca6-8808-1e2700be05c7__ep3,5000.0,5019.0,,,,,0.0
445
+ b6579cb5-0a71-4ca6-8808-1e2700be05c7__ep3:qa:251,test,b6579cb5-0a71-4ca6-8808-1e2700be05c7__ep3,5020.0,5039.0,5020.0,5039.0,5029.5,0.0,1.0
446
+ b6579cb5-0a71-4ca6-8808-1e2700be05c7__ep3:qa:256,test,b6579cb5-0a71-4ca6-8808-1e2700be05c7__ep3,5120.0,5139.0,,,,,0.0
447
+ b6579cb5-0a71-4ca6-8808-1e2700be05c7__ep3:qa:257,test,b6579cb5-0a71-4ca6-8808-1e2700be05c7__ep3,5140.0,5159.0,,,,,0.0
448
+ b6579cb5-0a71-4ca6-8808-1e2700be05c7__ep3:qa:264,test,b6579cb5-0a71-4ca6-8808-1e2700be05c7__ep3,5280.0,5299.0,,,,,0.0
449
+ b6579cb5-0a71-4ca6-8808-1e2700be05c7__ep3:qa:265,test,b6579cb5-0a71-4ca6-8808-1e2700be05c7__ep3,5300.0,5319.0,,,,,0.0
results/omni_finetune/model_output_task_probes_20260616/next_subtask_forecast/cosmos3_nano_future_window/metrics.json CHANGED
@@ -5,7 +5,7 @@
5
  "per_class_metrics_csv": "results/omni_finetune/model_output_task_probes_20260616/next_subtask_forecast/cosmos3_nano_future_window/per_class_metrics.csv",
6
  "predictions_csv": "results/omni_finetune/model_output_task_probes_20260616/next_subtask_forecast/cosmos3_nano_future_window/predictions.csv"
7
  },
8
- "generated_at_utc": "2026-06-18T20:58:30+00:00",
9
  "known_limitation": "This is a retrieval-derived future-subtask score. It is not a separately prompted generative subtask head, but it is target-backed by verified future-record retrieval outputs.",
10
  "labels": [
11
  "Adjust lantern string and handle components",
 
5
  "per_class_metrics_csv": "results/omni_finetune/model_output_task_probes_20260616/next_subtask_forecast/cosmos3_nano_future_window/per_class_metrics.csv",
6
  "predictions_csv": "results/omni_finetune/model_output_task_probes_20260616/next_subtask_forecast/cosmos3_nano_future_window/predictions.csv"
7
  },
8
+ "generated_at_utc": "2026-06-18T22:52:18+00:00",
9
  "known_limitation": "This is a retrieval-derived future-subtask score. It is not a separately prompted generative subtask head, but it is target-backed by verified future-record retrieval outputs.",
10
  "labels": [
11
  "Adjust lantern string and handle components",
results/omni_finetune/model_output_task_probes_20260616/object_set_forecast/cosmos3_nano_future_window/metrics.json CHANGED
@@ -6,7 +6,7 @@
6
  "exact_match": 0.013227513227513227,
7
  "false_negative_objects": 1127.0,
8
  "false_positive_objects": 747.0,
9
- "generated_at_utc": "2026-06-18T20:58:30+00:00",
10
  "known_limitation": "This is a retrieval-derived object-set score, not a separately prompted object-list generation head.",
11
  "metric_key": "object_set_forecast_micro_f1",
12
  "micro_f1": 0.01781970649895178,
 
6
  "exact_match": 0.013227513227513227,
7
  "false_negative_objects": 1127.0,
8
  "false_positive_objects": 747.0,
9
+ "generated_at_utc": "2026-06-18T22:52:18+00:00",
10
  "known_limitation": "This is a retrieval-derived object-set score, not a separately prompted object-list generation head.",
11
  "metric_key": "object_set_forecast_micro_f1",
12
  "micro_f1": 0.01781970649895178,
results/omni_finetune/model_output_task_probes_20260616/summary.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "generated_at_utc": "2026-06-18T20:58:30+00:00",
3
  "methods": {
4
  "cosmos3_nano_future_window": {
5
  "label": "Cosmos3-Nano Future Window",
@@ -7,6 +7,12 @@
7
  "source_prediction_jsonl": "results/omni_finetune/verified_public/xperience10m_cosmos3_nano_128ep_future_window_h5_compat_adapter_eval_test_full/eval/future_predictions.jsonl",
8
  "status": "scored",
9
  "tasks": {
 
 
 
 
 
 
10
  "long_horizon_next_action": {
11
  "horizon_windows": 5,
12
  "long_horizon_next_action_accuracy": 0.007936507936507936,
@@ -41,9 +47,7 @@
41
  "within_20_frames": 0.6666666666666666
42
  }
43
  },
44
- "unsupported_tasks": {
45
- "action_object_relation": "verified future-window predictions do not contain object-set fields"
46
- }
47
  },
48
  "cosmos3_super_reasoner": {
49
  "label": "Cosmos3-Super Reasoner",
@@ -58,6 +62,13 @@
58
  "source_metrics_json": "results/omni_finetune/model_output_task_probes_20260616/action_object_relation/cosmos3_super_reasoner/metrics.json",
59
  "valid_pred_relation_rate": 0.49327354260089684
60
  },
 
 
 
 
 
 
 
61
  "long_horizon_next_action": {
62
  "long_horizon_next_action_accuracy": 0.03794642857142857,
63
  "long_horizon_next_action_macro_f1": 0.008807588075880758,
@@ -91,10 +102,11 @@
91
  }
92
  },
93
  "scope": "Task-specific scoring from existing verified held-out model outputs. No new model inference, training, or target backfilling is performed.",
94
- "scored_method_task_count_added": 9,
95
  "status": "pass",
96
  "task_ids_added_to_matrix": [
97
  "action_object_relation",
 
98
  "long_horizon_next_action",
99
  "modality_reconstruction",
100
  "next_subtask_forecast",
 
1
  {
2
+ "generated_at_utc": "2026-06-18T22:52:18+00:00",
3
  "methods": {
4
  "cosmos3_nano_future_window": {
5
  "label": "Cosmos3-Nano Future Window",
 
7
  "source_prediction_jsonl": "results/omni_finetune/verified_public/xperience10m_cosmos3_nano_128ep_future_window_h5_compat_adapter_eval_test_full/eval/future_predictions.jsonl",
8
  "status": "scored",
9
  "tasks": {
10
+ "action_object_relation": {
11
+ "action_object_relation_accuracy": 0.013297872340425532,
12
+ "action_object_relation_macro_f1": 0.002794157670325683,
13
+ "scored_rows": 376,
14
+ "source_metrics_json": "results/omni_finetune/model_output_task_probes_20260616/action_object_relation/cosmos3_nano_future_window/metrics.json"
15
+ },
16
  "long_horizon_next_action": {
17
  "horizon_windows": 5,
18
  "long_horizon_next_action_accuracy": 0.007936507936507936,
 
47
  "within_20_frames": 0.6666666666666666
48
  }
49
  },
50
+ "unsupported_tasks": {}
 
 
51
  },
52
  "cosmos3_super_reasoner": {
53
  "label": "Cosmos3-Super Reasoner",
 
62
  "source_metrics_json": "results/omni_finetune/model_output_task_probes_20260616/action_object_relation/cosmos3_super_reasoner/metrics.json",
63
  "valid_pred_relation_rate": 0.49327354260089684
64
  },
65
+ "caption_grounding": {
66
+ "caption_grounding_center_hit_rate": 0.3236607142857143,
67
+ "caption_grounding_iou": 0.30639899644580487,
68
+ "missing_pred_evidence_window_count": 219,
69
+ "scored_rows": 448,
70
+ "source_metrics_json": "results/omni_finetune/model_output_task_probes_20260616/caption_grounding/cosmos3_super_reasoner/metrics.json"
71
+ },
72
  "long_horizon_next_action": {
73
  "long_horizon_next_action_accuracy": 0.03794642857142857,
74
  "long_horizon_next_action_macro_f1": 0.008807588075880758,
 
102
  }
103
  },
104
  "scope": "Task-specific scoring from existing verified held-out model outputs. No new model inference, training, or target backfilling is performed.",
105
+ "scored_method_task_count_added": 11,
106
  "status": "pass",
107
  "task_ids_added_to_matrix": [
108
  "action_object_relation",
109
+ "caption_grounding",
110
  "long_horizon_next_action",
111
  "modality_reconstruction",
112
  "next_subtask_forecast",
results/omni_finetune/model_output_task_probes_20260616/time_to_transition/cosmos3_nano_future_window/metrics.json CHANGED
@@ -4,7 +4,7 @@
4
  "predictions_csv": "results/omni_finetune/model_output_task_probes_20260616/time_to_transition/cosmos3_nano_future_window/predictions.csv"
5
  },
6
  "cap_frames": 200,
7
- "generated_at_utc": "2026-06-18T20:58:30+00:00",
8
  "known_limitation": "This is a derived future-window action-sequence probe, not evidence of a separately trained scalar time-regression head. It is included because task 20's boundary target is deterministically derivable once future-window action predictions are verified.",
9
  "metric_direction": "lower",
10
  "metric_key": "time_to_transition_mae",
 
4
  "predictions_csv": "results/omni_finetune/model_output_task_probes_20260616/time_to_transition/cosmos3_nano_future_window/predictions.csv"
5
  },
6
  "cap_frames": 200,
7
+ "generated_at_utc": "2026-06-18T22:52:18+00:00",
8
  "known_limitation": "This is a derived future-window action-sequence probe, not evidence of a separately trained scalar time-regression head. It is included because task 20's boundary target is deterministically derivable once future-window action predictions are verified.",
9
  "metric_direction": "lower",
10
  "metric_key": "time_to_transition_mae",
results/omni_finetune/model_output_task_probes_20260616/time_to_transition/cosmos3_super_reasoner/metrics.json CHANGED
@@ -5,7 +5,7 @@
5
  },
6
  "cap_frames": 200,
7
  "excluded_rows_without_true_action": 0,
8
- "generated_at_utc": "2026-06-18T20:58:30+00:00",
9
  "known_limitation": "This is a derived action-sequence probe, not evidence of a separately trained time-regression head. It is included because task 20's target is deterministically derivable from a sequence of action labels.",
10
  "metric_direction": "lower",
11
  "metric_key": "time_to_transition_mae",
 
5
  },
6
  "cap_frames": 200,
7
  "excluded_rows_without_true_action": 0,
8
+ "generated_at_utc": "2026-06-18T22:52:18+00:00",
9
  "known_limitation": "This is a derived action-sequence probe, not evidence of a separately trained time-regression head. It is included because task 20's target is deterministically derivable from a sequence of action labels.",
10
  "metric_direction": "lower",
11
  "metric_key": "time_to_transition_mae",
scripts/build_unified_task_model_radar.py CHANGED
@@ -71,6 +71,9 @@ QWEN_ACTION_OBJECT_METRICS_PATH = (
71
  COSMOS_SUPER_ACTION_OBJECT_METRICS_PATH = (
72
  MODEL_OUTPUT_TASK_PROBE_DIR / "action_object_relation/cosmos3_super_reasoner/metrics.json"
73
  )
 
 
 
74
  COSMOS_SUPER_TIME_TO_TRANSITION_METRICS_PATH = (
75
  MODEL_OUTPUT_TASK_PROBE_DIR / "time_to_transition/cosmos3_super_reasoner/metrics.json"
76
  )
@@ -89,6 +92,9 @@ COSMOS_NANO_MODALITY_RECONSTRUCTION_METRICS_PATH = (
89
  COSMOS_NANO_OBJECT_SET_METRICS_PATH = (
90
  MODEL_OUTPUT_TASK_PROBE_DIR / "object_set_forecast/cosmos3_nano_future_window/metrics.json"
91
  )
 
 
 
92
  COSMOS_NANO_TIME_TO_TRANSITION_METRICS_PATH = (
93
  MODEL_OUTPUT_TASK_PROBE_DIR / "time_to_transition/cosmos3_nano_future_window/metrics.json"
94
  )
@@ -231,6 +237,10 @@ FOUNDATION_TASK_METRICS = {
231
  "action_object_relation": {
232
  "qwen3_omni_v6_lora": "action_object_relation_macro_f1",
233
  "cosmos3_super_reasoner": "action_object_relation_macro_f1",
 
 
 
 
234
  },
235
  "long_horizon_next_action": {
236
  "cosmos3_super_reasoner": "long_horizon_next_action_macro_f1",
@@ -263,6 +273,7 @@ FOUNDATION_METRIC_PATHS = {
263
  FOUNDATION_METRIC_SOURCE_OVERRIDES = {
264
  ("qwen3_omni_v6_lora", "action_object_relation"): QWEN_ACTION_OBJECT_METRICS_PATH,
265
  ("cosmos3_super_reasoner", "action_object_relation"): COSMOS_SUPER_ACTION_OBJECT_METRICS_PATH,
 
266
  ("qwen3_omni_v6_lora", "caption_grounding"): QWEN_FUTURE_TASK_METRIC_PATHS["caption_grounding"],
267
  ("qwen3_omni_v6_lora", "cross_modal_retrieval"): QWEN_FUTURE_TASK_METRIC_PATHS["cross_modal_retrieval"],
268
  ("qwen3_omni_v6_lora", "temporal_order"): QWEN_FUTURE_TASK_METRIC_PATHS["temporal_order"],
@@ -275,6 +286,7 @@ FOUNDATION_METRIC_SOURCE_OVERRIDES = {
275
  ("cosmos3_nano_future_window", "long_horizon_next_action"): COSMOS_NANO_LONG_HORIZON_METRICS_PATH,
276
  ("cosmos3_nano_future_window", "next_subtask_forecast"): COSMOS_NANO_NEXT_SUBTASK_METRICS_PATH,
277
  ("cosmos3_nano_future_window", "modality_reconstruction"): COSMOS_NANO_MODALITY_RECONSTRUCTION_METRICS_PATH,
 
278
  ("cosmos3_nano_future_window", "object_set_forecast"): COSMOS_NANO_OBJECT_SET_METRICS_PATH,
279
  ("cosmos3_nano_future_window", "time_to_transition"): COSMOS_NANO_TIME_TO_TRANSITION_METRICS_PATH,
280
  ("cosmos3_super_reasoner", "long_horizon_next_action"): COSMOS_SUPER_LONG_HORIZON_METRICS_PATH,
@@ -312,8 +324,8 @@ METHOD_DETAILS = {
312
  "raw128_simple": "128-episode 4430-dim sensor NPZ simple heads; tasks 15/19 use compact proxies.",
313
  "raw128_neural_mlp": "128-episode 4430-dim sensor NPZ MLP heads; tasks 15/19 use compact proxies.",
314
  "qwen3_omni_v6_lora": "Verified held-out Qwen3-Omni v6 LoRA metrics, plus task 16 and any completed private-GPU future-task probes scored from task-specific JSON.",
315
- "cosmos3_super_reasoner": "Verified Cosmos3-Super base-weight Reasoner JSON-task evaluation, plus task 16 and a derived task-20 action-boundary timing probe scored from existing verified JSON.",
316
- "cosmos3_nano_future_window": "Verified Cosmos3-Nano future-window compatibility metrics, plus tasks 10/13/14/17 and a derived task-20 boundary timing probe scored from existing held-out future-window artifacts.",
317
  }
318
 
319
  PROXY_TASK_IDS = {"interaction_text_prediction", "camera_view_sync_retrieval"}
@@ -669,11 +681,13 @@ def build_payload() -> dict[str, Any]:
669
  cosmos_fd = read_json(COSMOS_SUPER_FD_METRICS_PATH)
670
  qwen.update(read_json(QWEN_ACTION_OBJECT_METRICS_PATH))
671
  cosmos_super.update(read_json(COSMOS_SUPER_ACTION_OBJECT_METRICS_PATH))
 
672
  cosmos_super.update(read_json(COSMOS_SUPER_LONG_HORIZON_METRICS_PATH))
673
  cosmos_super.update(read_json(COSMOS_SUPER_TIME_TO_TRANSITION_METRICS_PATH))
674
  cosmos_nano.update(read_json(COSMOS_NANO_LONG_HORIZON_METRICS_PATH))
675
  cosmos_nano.update(read_json(COSMOS_NANO_NEXT_SUBTASK_METRICS_PATH))
676
  cosmos_nano.update(read_json(COSMOS_NANO_MODALITY_RECONSTRUCTION_METRICS_PATH))
 
677
  cosmos_nano.update(read_json(COSMOS_NANO_OBJECT_SET_METRICS_PATH))
678
  cosmos_nano.update(read_json(COSMOS_NANO_TIME_TO_TRANSITION_METRICS_PATH))
679
  foundation_task_metrics = foundation_task_metric_mapping(qwen)
 
71
  COSMOS_SUPER_ACTION_OBJECT_METRICS_PATH = (
72
  MODEL_OUTPUT_TASK_PROBE_DIR / "action_object_relation/cosmos3_super_reasoner/metrics.json"
73
  )
74
+ COSMOS_SUPER_CAPTION_GROUNDING_METRICS_PATH = (
75
+ MODEL_OUTPUT_TASK_PROBE_DIR / "caption_grounding/cosmos3_super_reasoner/metrics.json"
76
+ )
77
  COSMOS_SUPER_TIME_TO_TRANSITION_METRICS_PATH = (
78
  MODEL_OUTPUT_TASK_PROBE_DIR / "time_to_transition/cosmos3_super_reasoner/metrics.json"
79
  )
 
92
  COSMOS_NANO_OBJECT_SET_METRICS_PATH = (
93
  MODEL_OUTPUT_TASK_PROBE_DIR / "object_set_forecast/cosmos3_nano_future_window/metrics.json"
94
  )
95
+ COSMOS_NANO_ACTION_OBJECT_METRICS_PATH = (
96
+ MODEL_OUTPUT_TASK_PROBE_DIR / "action_object_relation/cosmos3_nano_future_window/metrics.json"
97
+ )
98
  COSMOS_NANO_TIME_TO_TRANSITION_METRICS_PATH = (
99
  MODEL_OUTPUT_TASK_PROBE_DIR / "time_to_transition/cosmos3_nano_future_window/metrics.json"
100
  )
 
237
  "action_object_relation": {
238
  "qwen3_omni_v6_lora": "action_object_relation_macro_f1",
239
  "cosmos3_super_reasoner": "action_object_relation_macro_f1",
240
+ "cosmos3_nano_future_window": "action_object_relation_macro_f1",
241
+ },
242
+ "caption_grounding": {
243
+ "cosmos3_super_reasoner": "caption_grounding_iou",
244
  },
245
  "long_horizon_next_action": {
246
  "cosmos3_super_reasoner": "long_horizon_next_action_macro_f1",
 
273
  FOUNDATION_METRIC_SOURCE_OVERRIDES = {
274
  ("qwen3_omni_v6_lora", "action_object_relation"): QWEN_ACTION_OBJECT_METRICS_PATH,
275
  ("cosmos3_super_reasoner", "action_object_relation"): COSMOS_SUPER_ACTION_OBJECT_METRICS_PATH,
276
+ ("cosmos3_super_reasoner", "caption_grounding"): COSMOS_SUPER_CAPTION_GROUNDING_METRICS_PATH,
277
  ("qwen3_omni_v6_lora", "caption_grounding"): QWEN_FUTURE_TASK_METRIC_PATHS["caption_grounding"],
278
  ("qwen3_omni_v6_lora", "cross_modal_retrieval"): QWEN_FUTURE_TASK_METRIC_PATHS["cross_modal_retrieval"],
279
  ("qwen3_omni_v6_lora", "temporal_order"): QWEN_FUTURE_TASK_METRIC_PATHS["temporal_order"],
 
286
  ("cosmos3_nano_future_window", "long_horizon_next_action"): COSMOS_NANO_LONG_HORIZON_METRICS_PATH,
287
  ("cosmos3_nano_future_window", "next_subtask_forecast"): COSMOS_NANO_NEXT_SUBTASK_METRICS_PATH,
288
  ("cosmos3_nano_future_window", "modality_reconstruction"): COSMOS_NANO_MODALITY_RECONSTRUCTION_METRICS_PATH,
289
+ ("cosmos3_nano_future_window", "action_object_relation"): COSMOS_NANO_ACTION_OBJECT_METRICS_PATH,
290
  ("cosmos3_nano_future_window", "object_set_forecast"): COSMOS_NANO_OBJECT_SET_METRICS_PATH,
291
  ("cosmos3_nano_future_window", "time_to_transition"): COSMOS_NANO_TIME_TO_TRANSITION_METRICS_PATH,
292
  ("cosmos3_super_reasoner", "long_horizon_next_action"): COSMOS_SUPER_LONG_HORIZON_METRICS_PATH,
 
324
  "raw128_simple": "128-episode 4430-dim sensor NPZ simple heads; tasks 15/19 use compact proxies.",
325
  "raw128_neural_mlp": "128-episode 4430-dim sensor NPZ MLP heads; tasks 15/19 use compact proxies.",
326
  "qwen3_omni_v6_lora": "Verified held-out Qwen3-Omni v6 LoRA metrics, plus task 16 and any completed private-GPU future-task probes scored from task-specific JSON.",
327
+ "cosmos3_super_reasoner": "Verified Cosmos3-Super base-weight Reasoner JSON-task evaluation, plus task 8/16 and a derived task-20 action-boundary timing probe scored from existing verified JSON.",
328
+ "cosmos3_nano_future_window": "Verified Cosmos3-Nano future-window compatibility metrics, plus tasks 10/13/14/16/17 and a derived task-20 boundary timing probe scored from existing held-out future-window artifacts.",
329
  }
330
 
331
  PROXY_TASK_IDS = {"interaction_text_prediction", "camera_view_sync_retrieval"}
 
681
  cosmos_fd = read_json(COSMOS_SUPER_FD_METRICS_PATH)
682
  qwen.update(read_json(QWEN_ACTION_OBJECT_METRICS_PATH))
683
  cosmos_super.update(read_json(COSMOS_SUPER_ACTION_OBJECT_METRICS_PATH))
684
+ cosmos_super.update(read_json(COSMOS_SUPER_CAPTION_GROUNDING_METRICS_PATH))
685
  cosmos_super.update(read_json(COSMOS_SUPER_LONG_HORIZON_METRICS_PATH))
686
  cosmos_super.update(read_json(COSMOS_SUPER_TIME_TO_TRANSITION_METRICS_PATH))
687
  cosmos_nano.update(read_json(COSMOS_NANO_LONG_HORIZON_METRICS_PATH))
688
  cosmos_nano.update(read_json(COSMOS_NANO_NEXT_SUBTASK_METRICS_PATH))
689
  cosmos_nano.update(read_json(COSMOS_NANO_MODALITY_RECONSTRUCTION_METRICS_PATH))
690
+ cosmos_nano.update(read_json(COSMOS_NANO_ACTION_OBJECT_METRICS_PATH))
691
  cosmos_nano.update(read_json(COSMOS_NANO_OBJECT_SET_METRICS_PATH))
692
  cosmos_nano.update(read_json(COSMOS_NANO_TIME_TO_TRANSITION_METRICS_PATH))
693
  foundation_task_metrics = foundation_task_metric_mapping(qwen)
scripts/omni/score_existing_model_output_task_probes.py CHANGED
@@ -67,7 +67,6 @@ MODEL_SPECS = {
67
  "results/omni_finetune/model_output_task_probes_20260616/"
68
  "cosmos3_nano_future_window_target_map.jsonl"
69
  ),
70
- "action_object_relation_unsupported_reason": "verified future-window predictions do not contain object-set fields",
71
  },
72
  }
73
 
@@ -661,6 +660,263 @@ def score_cosmos_nano_object_set_from_target_map(
661
  return metrics
662
 
663
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
664
  def score_modality_reconstruction_from_feature_error(
665
  *,
666
  model_id: str,
@@ -1142,6 +1398,7 @@ def build_report(summary: dict[str, Any]) -> str:
1142
  task16 = task_results.get("action_object_relation", {})
1143
  task17 = task_results.get("object_set_forecast", {})
1144
  task20 = task_results.get("time_to_transition", {})
 
1145
  rows.append(
1146
  "| "
1147
  + " | ".join(
@@ -1175,6 +1432,11 @@ def build_report(summary: dict[str, Any]) -> str:
1175
  if task20.get("time_to_transition_mae") is not None
1176
  else "n/a"
1177
  ),
 
 
 
 
 
1178
  result.get("reason") or result.get("source_prediction_jsonl", ""),
1179
  ]
1180
  )
@@ -1188,8 +1450,8 @@ This package scores only task targets already present in verified held-out
1188
  prediction JSON. It does not run new inference and does not infer targets that
1189
  are absent from a model branch.
1190
 
1191
- | Method | ID | Status | Scored tasks | Task 13 macro-F1 | Task 14 macro-F1 | Task 16 macro-F1 | Task 17 micro-F1 | Task 20 MAE | Evidence |
1192
- | --- | --- | --- | --- | ---: | ---: | ---: | ---: | ---: | --- |
1193
  {chr(10).join(rows)}
1194
  """
1195
 
@@ -1213,9 +1475,7 @@ def main() -> int:
1213
  continue
1214
  task_results: dict[str, Any] = {}
1215
  unsupported: dict[str, str] = {}
1216
- if spec.get("action_object_relation_unsupported_reason"):
1217
- unsupported["action_object_relation"] = spec["action_object_relation_unsupported_reason"]
1218
- else:
1219
  metrics = score_action_object_relation(
1220
  model_id=model_id,
1221
  spec=spec,
@@ -1230,6 +1490,21 @@ def main() -> int:
1230
  "action_object_relation_macro_f1": metrics["action_object_relation_macro_f1"],
1231
  "action_object_relation_accuracy": metrics["action_object_relation_accuracy"],
1232
  }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1233
  if model_id == "cosmos3_nano_future_window":
1234
  manifest_path = workspace / spec["dataset_manifest"]
1235
  metrics = score_cosmos_nano_long_horizon_next_action(
@@ -1278,6 +1553,20 @@ def main() -> int:
1278
  "object_set_forecast_precision": metrics["object_set_forecast_precision"],
1279
  "object_set_forecast_recall": metrics["object_set_forecast_recall"],
1280
  }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1281
  metrics_path = workspace / spec["metrics_json"]
1282
  metrics = score_modality_reconstruction_from_feature_error(
1283
  model_id=model_id,
@@ -1356,6 +1645,7 @@ def main() -> int:
1356
  ),
1357
  "task_ids_added_to_matrix": [
1358
  "action_object_relation",
 
1359
  "long_horizon_next_action",
1360
  "modality_reconstruction",
1361
  "next_subtask_forecast",
 
67
  "results/omni_finetune/model_output_task_probes_20260616/"
68
  "cosmos3_nano_future_window_target_map.jsonl"
69
  ),
 
70
  },
71
  }
72
 
 
660
  return metrics
661
 
662
 
663
+ def score_cosmos_nano_action_object_relation_from_target_map(
664
+ *,
665
+ model_id: str,
666
+ spec: dict[str, Any],
667
+ prediction_jsonl: Path,
668
+ target_map_jsonl: Path,
669
+ output_dir: Path,
670
+ workspace: Path,
671
+ ) -> dict[str, Any]:
672
+ source_rows = read_jsonl(prediction_jsonl)
673
+ target_by_id = load_target_map(target_map_jsonl)
674
+ scored_rows: list[dict[str, Any]] = []
675
+ y_true: list[str] = []
676
+ y_pred: list[str] = []
677
+ missing_true_target_count = 0
678
+ missing_pred_target_count = 0
679
+
680
+ for row in source_rows:
681
+ future_id = str(row.get("future_record_id") or "")
682
+ pred_future_id = str(row.get("pred_future_record_id") or "")
683
+ true_target = target_by_id.get(future_id)
684
+ if not true_target:
685
+ missing_true_target_count += 1
686
+ continue
687
+ pred_target = target_by_id.get(pred_future_id)
688
+ if not pred_target:
689
+ missing_pred_target_count += 1
690
+ true_relation = relation_label(true_target.get("action"), true_target.get("objects"))
691
+ if true_relation is None:
692
+ continue
693
+ pred_relation = relation_label(
694
+ pred_target.get("action") if pred_target else None,
695
+ pred_target.get("objects") if pred_target else None,
696
+ missing_label=MISSING_PRED_RELATION,
697
+ )
698
+ y_true.append(true_relation)
699
+ y_pred.append(pred_relation or MISSING_PRED_RELATION)
700
+ scored_rows.append(
701
+ {
702
+ "id": row.get("id"),
703
+ "split": row.get("split"),
704
+ "episode_id": row.get("episode_id"),
705
+ "future_record_id": future_id,
706
+ "pred_future_record_id": pred_future_id,
707
+ "true_relation": true_relation,
708
+ "pred_relation": pred_relation,
709
+ "correct": int(true_relation == pred_relation),
710
+ "rank": row.get("rank"),
711
+ "top_k_hit": row.get("top_k_hit"),
712
+ }
713
+ )
714
+
715
+ if not y_true:
716
+ raise RuntimeError(f"no joined future action-object relation targets found in {prediction_jsonl}")
717
+
718
+ label_options = sorted(set(y_true))
719
+ metrics, per_class, _ = class_metrics(y_true, y_pred, label_options)
720
+ metrics.update(
721
+ {
722
+ "title": f"{spec['label']} Future Action-Object Relation Probe",
723
+ "status": "pass",
724
+ "generated_at_utc": datetime.now(timezone.utc).isoformat(timespec="seconds"),
725
+ "model_id": model_id,
726
+ "model_label": spec["label"],
727
+ "task_id": "action_object_relation",
728
+ "task_number": 16,
729
+ "task_label": "Action-Object Relation",
730
+ "metric_key": "action_object_relation_macro_f1",
731
+ "primary_metric": "action_object_relation_macro_f1",
732
+ "primary_score": metrics["macro_f1"],
733
+ "action_object_relation_macro_f1": metrics["macro_f1"],
734
+ "action_object_relation_accuracy": metrics["accuracy"],
735
+ "source_prediction_jsonl": relpath(prediction_jsonl, workspace),
736
+ "source_target_map_jsonl": relpath(target_map_jsonl, workspace),
737
+ "scope": "held_out_test_existing_future_window_retrieval_probe",
738
+ "score_policy": (
739
+ "Derived from existing verified held-out Cosmos3-Nano future-window predictions. "
740
+ "The true future record and retrieved future record are joined to the public-safe "
741
+ "target map, then scored on the action plus object-set relation."
742
+ ),
743
+ "normalization_policy": (
744
+ "Action text is whitespace-normalized. Objects are casefolded, deduplicated, "
745
+ "sorted, and joined into a canonical relation label before macro-F1 scoring."
746
+ ),
747
+ "known_limitation": (
748
+ "This is a retrieval-derived future relation score, not a separately prompted "
749
+ "action-object generation head."
750
+ ),
751
+ "total_prediction_rows": len(source_rows),
752
+ "target_map_rows": len(target_by_id),
753
+ "scored_rows": len(scored_rows),
754
+ "missing_true_target_count": missing_true_target_count,
755
+ "missing_pred_target_count": missing_pred_target_count,
756
+ "artifact_files": {
757
+ "metrics_json": relpath(output_dir / "metrics.json", workspace),
758
+ "predictions_csv": relpath(output_dir / "predictions.csv", workspace),
759
+ "per_class_metrics_csv": relpath(output_dir / "per_class_metrics.csv", workspace),
760
+ },
761
+ }
762
+ )
763
+ write_json(output_dir / "metrics.json", metrics)
764
+ write_csv(
765
+ output_dir / "predictions.csv",
766
+ scored_rows,
767
+ [
768
+ "id",
769
+ "split",
770
+ "episode_id",
771
+ "future_record_id",
772
+ "pred_future_record_id",
773
+ "true_relation",
774
+ "pred_relation",
775
+ "correct",
776
+ "rank",
777
+ "top_k_hit",
778
+ ],
779
+ )
780
+ write_csv(
781
+ output_dir / "per_class_metrics.csv",
782
+ per_class,
783
+ ["class_name", "support", "predicted", "precision", "recall", "f1"],
784
+ )
785
+ return metrics
786
+
787
+
788
+ def parse_window(value: Any) -> tuple[float, float] | None:
789
+ if not isinstance(value, dict):
790
+ return None
791
+ try:
792
+ start = float(value.get("start_frame"))
793
+ end = float(value.get("end_frame"))
794
+ except (TypeError, ValueError):
795
+ return None
796
+ if end < start:
797
+ return None
798
+ return start, end
799
+
800
+
801
+ def interval_iou(a: tuple[float, float], b: tuple[float, float]) -> float:
802
+ inter = max(0.0, min(a[1], b[1]) - max(a[0], b[0]) + 1.0)
803
+ union = max(a[1], b[1]) - min(a[0], b[0]) + 1.0
804
+ return inter / union if union > 0 else 0.0
805
+
806
+
807
+ def score_caption_grounding_from_evidence_window(
808
+ *,
809
+ model_id: str,
810
+ spec: dict[str, Any],
811
+ prediction_jsonl: Path,
812
+ output_dir: Path,
813
+ workspace: Path,
814
+ ) -> dict[str, Any]:
815
+ source_rows = read_jsonl(prediction_jsonl)
816
+ scored_rows: list[dict[str, Any]] = []
817
+ ious: list[float] = []
818
+ center_hits = 0
819
+ within_20_hits = 0
820
+ missing_pred_count = 0
821
+
822
+ for row in source_rows:
823
+ true_json = row.get("true_json") if isinstance(row.get("true_json"), dict) else {}
824
+ pred_json = row.get("pred_json") if isinstance(row.get("pred_json"), dict) else {}
825
+ true_window = parse_window(true_json.get("evidence_window"))
826
+ if true_window is None:
827
+ continue
828
+ pred_window = parse_window(pred_json.get("evidence_window"))
829
+ if pred_window is None:
830
+ missing_pred_count += 1
831
+ iou = 0.0
832
+ pred_center = None
833
+ center_error = None
834
+ else:
835
+ iou = interval_iou(true_window, pred_window)
836
+ pred_center = (pred_window[0] + pred_window[1]) / 2.0
837
+ true_center = (true_window[0] + true_window[1]) / 2.0
838
+ center_error = abs(pred_center - true_center)
839
+ center_hits += int(true_window[0] <= pred_center <= true_window[1])
840
+ within_20_hits += int(center_error <= 20.0)
841
+ ious.append(iou)
842
+ scored_rows.append(
843
+ {
844
+ "id": row.get("id"),
845
+ "split": row.get("split"),
846
+ "episode_id": row.get("episode_id"),
847
+ "true_start_frame": true_window[0],
848
+ "true_end_frame": true_window[1],
849
+ "pred_start_frame": pred_window[0] if pred_window else None,
850
+ "pred_end_frame": pred_window[1] if pred_window else None,
851
+ "pred_center_frame": pred_center,
852
+ "center_error_frames": center_error,
853
+ "iou": iou,
854
+ }
855
+ )
856
+
857
+ if not scored_rows:
858
+ raise RuntimeError(f"no evidence-window targets found in {prediction_jsonl}")
859
+
860
+ mean_iou = sum(ious) / len(ious)
861
+ center_hit_rate = center_hits / len(scored_rows)
862
+ within_20_rate = within_20_hits / len(scored_rows)
863
+ metrics = {
864
+ "title": f"{spec['label']} Evidence-Window Grounding Probe",
865
+ "status": "pass",
866
+ "generated_at_utc": datetime.now(timezone.utc).isoformat(timespec="seconds"),
867
+ "model_id": model_id,
868
+ "model_label": spec["label"],
869
+ "task_id": "caption_grounding",
870
+ "task_number": 8,
871
+ "task_label": "Language Grounding",
872
+ "metric_key": "caption_grounding_iou",
873
+ "primary_metric": "caption_grounding_iou",
874
+ "primary_score": mean_iou,
875
+ "caption_grounding_iou": mean_iou,
876
+ "caption_grounding_center_hit_rate": center_hit_rate,
877
+ "caption_grounding_within_20_frames": within_20_rate,
878
+ "source_prediction_jsonl": relpath(prediction_jsonl, workspace),
879
+ "scope": "held_out_test_existing_verified_prediction_json",
880
+ "score_policy": (
881
+ "Derived from existing verified held-out structured JSON predictions. The task target is "
882
+ "the evidence_window field already present in the true JSON; missing or invalid predicted "
883
+ "evidence windows receive zero IoU."
884
+ ),
885
+ "normalization_policy": (
886
+ "Evidence windows are frame intervals. The primary score is mean interval IoU; center-hit "
887
+ "and within-20-frame rates are reported as diagnostics."
888
+ ),
889
+ "known_limitation": (
890
+ "This is an evidence-window localization score, not a candidate-set retrieval MRR."
891
+ ),
892
+ "total_prediction_rows": len(source_rows),
893
+ "scored_rows": len(scored_rows),
894
+ "missing_pred_evidence_window_count": missing_pred_count,
895
+ "artifact_files": {
896
+ "metrics_json": relpath(output_dir / "metrics.json", workspace),
897
+ "predictions_csv": relpath(output_dir / "predictions.csv", workspace),
898
+ },
899
+ }
900
+ write_json(output_dir / "metrics.json", metrics)
901
+ write_csv(
902
+ output_dir / "predictions.csv",
903
+ scored_rows,
904
+ [
905
+ "id",
906
+ "split",
907
+ "episode_id",
908
+ "true_start_frame",
909
+ "true_end_frame",
910
+ "pred_start_frame",
911
+ "pred_end_frame",
912
+ "pred_center_frame",
913
+ "center_error_frames",
914
+ "iou",
915
+ ],
916
+ )
917
+ return metrics
918
+
919
+
920
  def score_modality_reconstruction_from_feature_error(
921
  *,
922
  model_id: str,
 
1398
  task16 = task_results.get("action_object_relation", {})
1399
  task17 = task_results.get("object_set_forecast", {})
1400
  task20 = task_results.get("time_to_transition", {})
1401
+ task8 = task_results.get("caption_grounding", {})
1402
  rows.append(
1403
  "| "
1404
  + " | ".join(
 
1432
  if task20.get("time_to_transition_mae") is not None
1433
  else "n/a"
1434
  ),
1435
+ (
1436
+ f"{task8.get('caption_grounding_iou', 0.0):.6f}"
1437
+ if task8.get("caption_grounding_iou") is not None
1438
+ else "n/a"
1439
+ ),
1440
  result.get("reason") or result.get("source_prediction_jsonl", ""),
1441
  ]
1442
  )
 
1450
  prediction JSON. It does not run new inference and does not infer targets that
1451
  are absent from a model branch.
1452
 
1453
+ | Method | ID | Status | Scored tasks | Task 13 macro-F1 | Task 14 macro-F1 | Task 16 macro-F1 | Task 17 micro-F1 | Task 20 MAE | Task 8 IoU | Evidence |
1454
+ | --- | --- | --- | --- | ---: | ---: | ---: | ---: | ---: | ---: | --- |
1455
  {chr(10).join(rows)}
1456
  """
1457
 
 
1475
  continue
1476
  task_results: dict[str, Any] = {}
1477
  unsupported: dict[str, str] = {}
1478
+ if model_id != "cosmos3_nano_future_window":
 
 
1479
  metrics = score_action_object_relation(
1480
  model_id=model_id,
1481
  spec=spec,
 
1490
  "action_object_relation_macro_f1": metrics["action_object_relation_macro_f1"],
1491
  "action_object_relation_accuracy": metrics["action_object_relation_accuracy"],
1492
  }
1493
+ if model_id == "cosmos3_super_reasoner":
1494
+ metrics = score_caption_grounding_from_evidence_window(
1495
+ model_id=model_id,
1496
+ spec=spec,
1497
+ prediction_jsonl=prediction_path,
1498
+ output_dir=output_dir / "caption_grounding" / model_id,
1499
+ workspace=workspace,
1500
+ )
1501
+ task_results["caption_grounding"] = {
1502
+ "source_metrics_json": metrics["artifact_files"]["metrics_json"],
1503
+ "scored_rows": metrics["scored_rows"],
1504
+ "caption_grounding_iou": metrics["caption_grounding_iou"],
1505
+ "caption_grounding_center_hit_rate": metrics["caption_grounding_center_hit_rate"],
1506
+ "missing_pred_evidence_window_count": metrics["missing_pred_evidence_window_count"],
1507
+ }
1508
  if model_id == "cosmos3_nano_future_window":
1509
  manifest_path = workspace / spec["dataset_manifest"]
1510
  metrics = score_cosmos_nano_long_horizon_next_action(
 
1553
  "object_set_forecast_precision": metrics["object_set_forecast_precision"],
1554
  "object_set_forecast_recall": metrics["object_set_forecast_recall"],
1555
  }
1556
+ metrics = score_cosmos_nano_action_object_relation_from_target_map(
1557
+ model_id=model_id,
1558
+ spec=spec,
1559
+ prediction_jsonl=prediction_path,
1560
+ target_map_jsonl=target_map_path,
1561
+ output_dir=output_dir / "action_object_relation" / model_id,
1562
+ workspace=workspace,
1563
+ )
1564
+ task_results["action_object_relation"] = {
1565
+ "source_metrics_json": metrics["artifact_files"]["metrics_json"],
1566
+ "scored_rows": metrics["scored_rows"],
1567
+ "action_object_relation_macro_f1": metrics["action_object_relation_macro_f1"],
1568
+ "action_object_relation_accuracy": metrics["action_object_relation_accuracy"],
1569
+ }
1570
  metrics_path = workspace / spec["metrics_json"]
1571
  metrics = score_modality_reconstruction_from_feature_error(
1572
  model_id=model_id,
 
1645
  ),
1646
  "task_ids_added_to_matrix": [
1647
  "action_object_relation",
1648
+ "caption_grounding",
1649
  "long_horizon_next_action",
1650
  "modality_reconstruction",
1651
  "next_subtask_forecast",