Robotics
PyTorch
Cosmos
xperience10m_task_baseline_suite
embodied-ai
multimodal
xperience-10m
baseline
evaluation
qwen3-omni
Instructions to use cy0307/ropedia-xperience-10m-task-baselines with libraries, inference providers, notebooks, and local apps. Follow these links to get started.
- Libraries
- Cosmos
How to use cy0307/ropedia-xperience-10m-task-baselines with Cosmos:
# No code snippets available yet for this library.
# To use this model, check the repository files and the library's documentation.
# Want to help? PRs adding snippets are welcome at:
# https://github.com/huggingface/huggingface.js
- Notebooks
- Google Colab
- Kaggle
| { | |
| "title": "Ropedia Xperience-10M Task Suite Project Status", | |
| "version": "2026-06-01", | |
| "decision": "public_sample_pipeline_verified_multi_episode_omni_data_staging", | |
| "research_positioning": "A research-engineering study that makes one public Xperience-10M sample episode inspectable, defines embodied-AI tasks over synchronized modalities, records baseline behavior, and keeps later multi-episode model-quality claims separate from current single-episode evidence.", | |
| "scope_boundary": { | |
| "validated_episode_count": 1, | |
| "aligned_frames": 5821, | |
| "sliding_windows": 1161, | |
| "current_feature_dimensions": 8546, | |
| "core_task_count": 12, | |
| "neural_head_count": 12, | |
| "direction_extension_probe_count": 4, | |
| "audio_featurized": true, | |
| "raw_xperience10m_data_redistributed": false, | |
| "qwen3_omni_32_episode_claim": false | |
| }, | |
| "rows": [ | |
| { | |
| "area": "Public-sample pipeline", | |
| "status": "verified", | |
| "evidence": [ | |
| "results/episode_task_suite/summary_report.json", | |
| "results/episode_task_suite/windows.csv", | |
| "results/episode_task_suite/feature_manifest.json" | |
| ], | |
| "readout": "One public Xperience-10M sample episode is converted into 5,821 frames, 1,161 aligned 20-frame windows, and an 8,546-dimensional representation for repeatable task evaluation." | |
| }, | |
| { | |
| "area": "Task suite", | |
| "status": "verified", | |
| "evidence": [ | |
| "scripts/episode_task_suite.py", | |
| "results/episode_task_suite/", | |
| "docs/data/summary_metrics.json" | |
| ], | |
| "readout": "All 12 task contracts have committed metrics, predictions, and minimal baseline outputs." | |
| }, | |
| { | |
| "area": "Neural heads", | |
| "status": "verified", | |
| "evidence": [ | |
| "scripts/neural_task_models.py", | |
| "results/episode_task_suite/neural_mlp/" | |
| ], | |
| "readout": "Each task also has a compact PyTorch MLP run over the same feature tensor and chronological split." | |
| }, | |
| { | |
| "area": "Audio contribution study", | |
| "status": "verified", | |
| "evidence": [ | |
| "scripts/audio_ablation_and_raw_upgrade.py", | |
| "results/audio_ablation/", | |
| "docs/data/audio_ablation_summary.json" | |
| ], | |
| "readout": "Audio variants improve the primary metric on 6 of 12 task contracts in this single-episode setting." | |
| }, | |
| { | |
| "area": "Evaluation protocol", | |
| "status": "verified", | |
| "evidence": [ | |
| "EVALUATION_PROTOCOL.md", | |
| "docs/data/evaluation_protocol.json", | |
| "scripts/build_evaluation_protocol.py" | |
| ], | |
| "readout": "Windowing, chronological split, per-task metrics, leakage controls, and current limitations are generated from committed metric artifacts." | |
| }, | |
| { | |
| "area": "Research takeaways", | |
| "status": "verified", | |
| "evidence": [ | |
| "RESEARCH_TAKEAWAYS.md", | |
| "docs/data/research_takeaways.json", | |
| "scripts/build_research_takeaways.py" | |
| ], | |
| "readout": "The main result interpretation is generated from committed metrics: chronological class shift, neural gains on dynamics/order/alignment, open retrieval/reconstruction problems, and the need for held-out episodes." | |
| }, | |
| { | |
| "area": "Research roadmap", | |
| "status": "current", | |
| "evidence": [ | |
| "RESEARCH_ROADMAP.md", | |
| "docs/data/research_roadmap.json" | |
| ], | |
| "readout": "The staged path connects public-sample task development to 128-episode data staging, Qwen3-Omni LoRA, foundation-model selection, robustness runs, and larger omni/world-model extensions." | |
| }, | |
| { | |
| "area": "Foundation-model plan", | |
| "status": "current", | |
| "evidence": [ | |
| "FOUNDATION_MODEL_PLAN.md", | |
| "docs/data/foundation_model_plan.json" | |
| ], | |
| "readout": "Qwen3-Omni remains the first trainable held-out LoRA baseline; Cosmos 3 is added as the first world-model/action-generation branch; OpenVLA/openpi/GR00T are policy candidates after action targets are explicit." | |
| }, | |
| { | |
| "area": "Official dataset wording", | |
| "status": "verified", | |
| "evidence": [ | |
| "XPERIENCE10M_DATASET_CARD_ALIGNMENT.md", | |
| "docs/data/xperience10m_dataset_card_alignment.json" | |
| ], | |
| "readout": "Public wording is aligned to the official gated Xperience-10M dataset card, public sample card, and HF API metadata, including modalities, scale, access path, sample license/tooling, and current project coverage." | |
| }, | |
| { | |
| "area": "Source alignment", | |
| "status": "verified", | |
| "evidence": [ | |
| "SOURCE_ALIGNMENT_AUDIT.md", | |
| "docs/data/source_alignment_audit.json", | |
| "scripts/validate_source_alignment.py" | |
| ], | |
| "readout": "Source facts, sample details, API-listing notes, and project coverage are checked across repo docs, website, and HF cards." | |
| }, | |
| { | |
| "area": "Website and HF mirrors", | |
| "status": "verified", | |
| "evidence": [ | |
| "docs/data/website_integrity.json", | |
| "docs/data/mirror_parity.json", | |
| "docs/data/live_publication_status.json" | |
| ], | |
| "readout": "Local website links and assets pass integrity checks, prepared mirrors match, and public GitHub/HF URLs have been checked after upload." | |
| }, | |
| { | |
| "area": "Publication package", | |
| "status": "verified", | |
| "evidence": [ | |
| "docs/data/publication_audit.json", | |
| "QUALITY_GATES.md", | |
| "docs/data/quality_gates.json" | |
| ], | |
| "readout": "Public bundles are checked for raw-data exclusion, cache exclusion, heavy-archive exclusion, token-string scanning, and stale presentation copy." | |
| }, | |
| { | |
| "area": "Reproducibility", | |
| "status": "verified_for_public_sample", | |
| "evidence": [ | |
| "REPRODUCIBILITY.md", | |
| "docs/data/reproducibility_matrix.json", | |
| "notes/reproducibility_audit.md" | |
| ], | |
| "readout": "The public sample workflow has explicit commands, expected outputs, and exact-match reproduction evidence." | |
| }, | |
| { | |
| "area": "Qwen3-Omni fine-tuning", | |
| "status": "data_staging_full_metrics_pending", | |
| "evidence": [ | |
| "results/omni_finetune/DATA_ACCESS_STATUS.md", | |
| "results/omni_finetune/MULTI_EPISODE_ACCESS_STATUS.md" | |
| ], | |
| "readout": "Full-dataset access is granted and a 128-episode selected relay is in progress with chunked parallel transfer and overlapping batch prefetch; final held-out metrics require completed staging, manifest construction, training, and held-out evaluation." | |
| }, | |
| { | |
| "area": "Raw Xperience-10M redistribution", | |
| "status": "not_included", | |
| "evidence": [ | |
| "DATA_NOTICE.md", | |
| "docs/data/publication_audit.json" | |
| ], | |
| "readout": "Raw MP4, HDF5, and RRD files, private gated data, and full Qwen weights are intentionally excluded." | |
| } | |
| ], | |
| "fast_research_route": [ | |
| "Read PROJECT_STATUS.md and EVIDENCE_CONTRACT.md to establish what is implemented.", | |
| "Open docs/data/project_packet.json for the machine-readable project path.", | |
| "Inspect RESEARCH_TAKEAWAYS.md and docs/data/research_takeaways.json before interpreting model scores.", | |
| "Inspect RESEARCH_ROADMAP.md and docs/data/research_roadmap.json for the staged path from public-sample task work to multi-episode modeling.", | |
| "Inspect FOUNDATION_MODEL_PLAN.md and docs/data/foundation_model_plan.json before choosing a backbone branch.", | |
| "Inspect docs/data/summary_metrics.json and results/episode_task_suite/neural_mlp/ to check the 12-task outputs.", | |
| "Inspect results/audio_ablation/AUDIO_ABLATION_SUMMARY.md before judging whether audio helps the current task suite.", | |
| "Inspect EVALUATION_PROTOCOL.md before judging task metrics or leakage controls.", | |
| "Inspect SOURCE_ALIGNMENT_AUDIT.md before judging source-card consistency across public surfaces.", | |
| "Inspect XPERIENCE10M_DATASET_CARD_ALIGNMENT.md before judging dataset wording.", | |
| "Inspect results/omni_finetune/DATA_ACCESS_STATUS.md before judging Qwen3-Omni scale-up status." | |
| ], | |
| "current_reading_notes": [ | |
| "Cross-episode generalization is deferred to the later multi-episode stage; it is not evaluated in the current single-episode results.", | |
| "Older pilot path names refer to setup files, not completed held-out training results.", | |
| "The current reconstruction task reconstructs feature vectors; it does not perform pixel-depth, mesh, NeRF, or Gaussian reconstruction.", | |
| "Audio is one of the synchronized source modalities in the current task representation.", | |
| "The audio ablation report compares audio/no-audio variants across all 12 task contracts in results/audio_ablation/.", | |
| "Foundation-model selection is explicit: Qwen3-Omni is the immediate trainable pilot, Cosmos 3 is the first world-model branch, and policy models such as OpenVLA/openpi/GR00T wait for action-target conversion." | |
| ] | |
| } | |