File size: 5,906 Bytes
a49986a
 
 
7d21adc
a49986a
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
b5c6bbb
 
 
 
 
a49986a
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
7d21adc
 
 
 
 
a49986a
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
7d21adc
 
 
 
 
a49986a
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
b5c6bbb
 
a49986a
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
{
  "title": "Ropedia Xperience-10M Public Reader Map",
  "status": "published",
  "purpose": "Organize the GitHub repo, GitHub Pages dashboard, Hugging Face Space, artifact dataset, baseline model repo, consolidated weights/results repo, and model-branch repos without removing evidence.",
  "fast_paths": [
    {
      "reader_goal": "Understand the project in one pass",
      "start_here": "PROJECT_BRIEF.md",
      "then_inspect": ["PROJECT_STATUS.md", "RESEARCH_TAKEAWAYS.md"]
    },
    {
      "reader_goal": "See the visual public dashboard",
      "start_here": "GitHub Pages dashboard or Hugging Face Space",
      "then_inspect": ["docs/index.html", "docs/data/project_packet.json"]
    },
    {
      "reader_goal": "Understand the data unit",
      "start_here": "results/episode_task_suite/windows.csv",
      "then_inspect": ["results/episode_task_suite/feature_manifest.json", "docs/data/raw_sample_files.json"]
    },
    {
      "reader_goal": "Trace the 128-episode split",
      "start_here": "XPERIENCE10M_128_EPISODE_FEATURE_INDEX.md",
      "then_inspect": ["docs/data/xperience10m_128_episode_feature_index.json", "results/omni_finetune/xperience10m_128_episode_selection.csv"]
    },
    {
      "reader_goal": "Inspect the 20-task benchmark",
      "start_here": "TASK_SUITE_20.md",
      "then_inspect": ["docs/data/task_suite_20.json", "EVALUATION_PROTOCOL.md"]
    },
    {
      "reader_goal": "Compare current results",
      "start_here": "RESEARCH_TAKEAWAYS.md",
      "then_inspect": ["docs/data/task_method_20_result_matrix.json", "docs/data/unified_task_model_radar.json"]
    },
    {
      "reader_goal": "Compare 1-episode and 128-episode methods",
      "start_here": "Homepage radar section",
      "then_inspect": ["docs/data/single_episode_task_model_radar.json", "docs/data/episode128_task_model_radar.json"]
    },
    {
      "reader_goal": "Find all derived artifacts",
      "start_here": "ARTIFACT_GUIDE.md",
      "then_inspect": ["Hugging Face artifact dataset", "docs/data/artifact_index.json"]
    },
    {
      "reader_goal": "Download model weights with their matching results",
      "start_here": "Hugging Face weights/results repo",
      "then_inspect": ["manifest.json", "analysis/docs/data/task_method_20_result_matrix.json", "results/"]
    },
    {
      "reader_goal": "Reproduce or extend the work",
      "start_here": "REPRODUCIBILITY.md",
      "then_inspect": ["QUALITY_GATES.md", "scripts/", "results/"]
    },
    {
      "reader_goal": "Understand foundation-model directions",
      "start_here": "THREE_FOUNDATION_PIPELINES.md",
      "then_inspect": ["FOUNDATION_MODEL_PLAN.md", "docs/data/three_foundation_pipelines.json"]
    },
    {
      "reader_goal": "Check public-release health",
      "start_here": "PUBLIC_SURFACE_QA.md",
      "then_inspect": ["docs/data/live_publication_status.json", "docs/data/mirror_parity.json"]
    }
  ],
  "public_surfaces": [
    {
      "surface": "GitHub repo",
      "responsibility": "Source of truth for docs, scripts, generated data, validators, and commit history.",
      "best_use": "Auditing implementation and citing exact files."
    },
    {
      "surface": "GitHub Pages dashboard",
      "responsibility": "Reader-facing visual overview of the dataset sample, tasks, methods, results, directions, and resources.",
      "best_use": "Understanding the project quickly."
    },
    {
      "surface": "Hugging Face Space",
      "responsibility": "Hub-hosted copy of the dashboard and static app assets.",
      "best_use": "Sharing the visual dashboard from Hugging Face."
    },
    {
      "surface": "HF artifact dataset",
      "responsibility": "Public-safe derived artifacts, reports, metrics, website JSON, and sanitized model result packages.",
      "best_use": "Downloading evidence bundles."
    },
    {
      "surface": "HF baseline model repo",
      "responsibility": "Baseline weights, metrics, figures, and mirrored task artifacts.",
      "best_use": "Reusing compact baseline outputs."
    },
    {
      "surface": "HF weights/results repo",
      "responsibility": "Consolidated baseline weights, Qwen3/Cosmos adapter weights, verified results, analysis files, and a file-level manifest.",
      "best_use": "Auditing all public-safe weight-bearing artifacts from one repo."
    },
    {
      "surface": "Qwen3/Cosmos model repos",
      "responsibility": "Adapter-specific public weights or package cards when a branch is verified and publishable.",
      "best_use": "Inspecting model-branch artifacts."
    }
  ],
  "evidence_layers": [
    "Dataset/source boundary",
    "Data contract",
    "Task suite",
    "Results",
    "Foundation directions",
    "Public-release checks"
  ],
  "claim_boundaries": [
    {
      "claim_type": "Single public-sample task behavior",
      "public_evidence": ["results/episode_task_suite/", "docs/data/task_suite_20.json"],
      "boundary": "Describes one public sample episode, not the full dataset distribution."
    },
    {
      "claim_type": "128-episode baseline comparison",
      "public_evidence": ["XPERIENCE10M_128_EPISODE_FEATURE_INDEX.md", "docs/data/xperience10m_128_episode_feature_index.json", "results/omni_finetune/*128*", "docs/data/omni_model_comparison.json"],
      "boundary": "Uses selected held-out episodes and derived public-safe summaries; official raw files remain gated upstream."
    },
    {
      "claim_type": "Foundation-model branch quality",
      "public_evidence": ["Verified Qwen3/Cosmos result packages", "model cards"],
      "boundary": "Numeric task scores appear only when a task-specific eval or probe exists."
    },
    {
      "claim_type": "Reproducibility",
      "public_evidence": ["REPRODUCIBILITY.md", "QUALITY_GATES.md", "release validators"],
      "boundary": "Raw gated Xperience-10M files and full foundation weights are not redistributed."
    }
  ]
}