Robotics
PyTorch
Cosmos
xperience10m_task_baseline_suite
embodied-ai
multimodal
xperience-10m
baseline
evaluation
qwen3-omni
Instructions to use cy0307/ropedia-xperience-10m-task-baselines with libraries, inference providers, notebooks, and local apps. Follow these links to get started.
- Libraries
- Cosmos
How to use cy0307/ropedia-xperience-10m-task-baselines with Cosmos:
# No code snippets available yet for this library. # To use this model, check the repository files and the library's documentation. # Want to help? PRs adding snippets are welcome at: # https://github.com/huggingface/huggingface.js
- Notebooks
- Google Colab
- Kaggle
| #!/usr/bin/env python3 | |
| """Build the interactive research-roadmap data contract for the public site.""" | |
| from __future__ import annotations | |
| import json | |
| from datetime import datetime, timezone | |
| from pathlib import Path | |
| from typing import Any | |
| ROOT = Path(__file__).resolve().parents[1] | |
| DOCS_DATA = ROOT / "docs" / "data" | |
| RESULTS = ROOT / "results" / "episode_task_suite" | |
| GITHUB_BLOB = "https://github.com/ChaoYue0307/ropedia-xperience-10m-task-suite/blob/main" | |
| def repo_link(path: str) -> str: | |
| return f"{GITHUB_BLOB}/{path}" | |
| def load_json(path: Path) -> Any: | |
| return json.loads(path.read_text(encoding="utf-8")) | |
| def rounded_metric(value: Any) -> float | None: | |
| if value is None: | |
| return None | |
| try: | |
| return round(float(value), 4) | |
| except (TypeError, ValueError): | |
| return None | |
| def metric_summary(metric: dict[str, Any] | None) -> dict[str, Any]: | |
| if not metric: | |
| return {} | |
| return { | |
| "key": metric.get("key"), | |
| "name": metric.get("name"), | |
| "direction": metric.get("direction"), | |
| "minimal": rounded_metric(metric.get("minimal")), | |
| "neural_mlp": rounded_metric(metric.get("neural_mlp")), | |
| "better_baseline": metric.get("better_baseline"), | |
| } | |
| def task_evidence_links(task_id: str) -> list[dict[str, str]]: | |
| candidates = [ | |
| ("Minimal metrics", f"results/episode_task_suite/{task_id}/metrics.json"), | |
| ("Neural metrics", f"results/episode_task_suite/neural_mlp/{task_id}/metrics.json"), | |
| ("Minimal predictions", f"results/episode_task_suite/{task_id}/predictions.csv"), | |
| ("Neural predictions", f"results/episode_task_suite/neural_mlp/{task_id}/predictions.csv"), | |
| ("Confusion matrix", f"results/episode_task_suite/{task_id}/confusion_matrix.csv"), | |
| ("Neural confusion matrix", f"results/episode_task_suite/neural_mlp/{task_id}/confusion_matrix.csv"), | |
| ] | |
| links = [ | |
| {"label": "Task walkthrough", "href": "data/task_walkthroughs.json"}, | |
| {"label": "Single-episode explorer", "href": "single_episode_explorer.html"}, | |
| ] | |
| for label, relative_path in candidates: | |
| if (ROOT / relative_path).exists(): | |
| links.append({"label": label, "href": repo_link(relative_path)}) | |
| return links | |
| def task_payload( | |
| task_id: str, | |
| direction_task: dict[str, Any], | |
| walkthrough: dict[str, Any], | |
| ) -> dict[str, Any]: | |
| metric = direction_task.get("metric") or walkthrough.get("metric") or {} | |
| return { | |
| "id": task_id, | |
| "display_name": walkthrough.get("display_name") or direction_task.get("name") or task_id, | |
| "research_name": walkthrough.get("research_name") or direction_task.get("name") or task_id, | |
| "family": direction_task.get("family") or walkthrough.get("task_family"), | |
| "architecture_family": walkthrough.get("architecture_family"), | |
| "primary_direction": direction_task.get("primary_direction"), | |
| "direction_roles": direction_task.get("direction_roles", {}), | |
| "modalities": walkthrough.get("modalities", []), | |
| "case_study": walkthrough.get("case_study"), | |
| "input": walkthrough.get("input"), | |
| "input_short": walkthrough.get("input_short"), | |
| "process_short": walkthrough.get("process_short"), | |
| "output_short": walkthrough.get("output_short"), | |
| "module_summary": walkthrough.get("module_summary"), | |
| "current_limit": direction_task.get("current_limit") or walkthrough.get("failure_mode"), | |
| "why": direction_task.get("why"), | |
| "metric": metric_summary(metric), | |
| "evidence_links": task_evidence_links(task_id), | |
| } | |
| def phase_payload(phases: list[dict[str, Any]]) -> list[dict[str, Any]]: | |
| stage_map = { | |
| "implemented": "now", | |
| "active": "scale_up", | |
| "next": "omni", | |
| "planned": "future", | |
| } | |
| return [ | |
| { | |
| "id": phase.get("id"), | |
| "name": phase.get("name"), | |
| "status": phase.get("status"), | |
| "stage": stage_map.get(str(phase.get("status", "")).lower(), "future"), | |
| "entry_condition": phase.get("entry_condition"), | |
| "deliverables": phase.get("deliverables", []), | |
| "completion_evidence": phase.get("completion_evidence", []), | |
| "reader_takeaway": phase.get("reader_takeaway"), | |
| } | |
| for phase in phases | |
| ] | |
| def main() -> int: | |
| directions_doc = load_json(DOCS_DATA / "research_directions.json") | |
| walkthroughs = load_json(DOCS_DATA / "task_walkthroughs.json") | |
| roadmap = load_json(DOCS_DATA / "research_roadmap.json") | |
| foundation_plan = load_json(DOCS_DATA / "foundation_model_plan.json") | |
| additional_directions = load_json(DOCS_DATA / "additional_development_directions.json") | |
| summary_metrics = load_json(DOCS_DATA / "summary_metrics.json") | |
| episode_summary = load_json(RESULTS / "summary_report.json") | |
| feature_manifest = load_json(RESULTS / "feature_manifest.json") | |
| extension_doc = load_json(DOCS_DATA / "research_direction_extensions.json") | |
| tasks: dict[str, dict[str, Any]] = {} | |
| for task_id, direction_task in directions_doc.get("tasks", {}).items(): | |
| tasks[task_id] = task_payload( | |
| task_id, | |
| direction_task, | |
| walkthroughs.get("tasks", {}).get(task_id, {}), | |
| ) | |
| directions = [] | |
| for code, direction in directions_doc.get("directions", {}).items(): | |
| linked_tasks = [tasks[task_id] for task_id in direction.get("tasks", []) if task_id in tasks] | |
| extension_tasks = [ | |
| { | |
| "id": task_id, | |
| "name": spec.get("name"), | |
| "family": spec.get("family"), | |
| "metric_name": spec.get("metric_name"), | |
| "current_limit": spec.get("current_limit"), | |
| } | |
| for task_id, spec in extension_doc.get("task_specs", {}).items() | |
| if spec.get("direction") == code | |
| ] | |
| directions.append( | |
| { | |
| "code": code, | |
| "id": direction.get("id"), | |
| "name": direction.get("name"), | |
| "focus": direction.get("focus"), | |
| "preferred_background": direction.get("preferred_background"), | |
| "current_status": direction.get("current_status"), | |
| "current_readout": direction.get("current_readout"), | |
| "next_steps": direction.get("next_steps", []), | |
| "counts": direction.get("counts", {}), | |
| "task_ids": direction.get("tasks", []), | |
| "tasks": linked_tasks, | |
| "extension_tasks": extension_tasks, | |
| } | |
| ) | |
| omni = summary_metrics.get("omni_relay", {}) | |
| payload = { | |
| "title": "Interactive Research Roadmap", | |
| "generated_at_utc": datetime.now(timezone.utc).isoformat(timespec="seconds"), | |
| "source_files": [ | |
| "docs/data/research_directions.json", | |
| "docs/data/task_walkthroughs.json", | |
| "docs/data/research_roadmap.json", | |
| "docs/data/foundation_model_plan.json", | |
| "docs/data/additional_development_directions.json", | |
| "docs/data/summary_metrics.json", | |
| "docs/data/research_direction_extensions.json", | |
| "results/episode_task_suite/summary_report.json", | |
| "results/episode_task_suite/feature_manifest.json", | |
| ], | |
| "scope": { | |
| "sample_episode_count": walkthroughs.get("scope", {}).get("episode_count", 1), | |
| "num_frames": episode_summary.get("num_frames"), | |
| "num_windows": episode_summary.get("num_windows"), | |
| "feature_dim": episode_summary.get("feature_dim"), | |
| "window_frames": episode_summary.get("window_frames"), | |
| "stride_frames": episode_summary.get("stride_frames"), | |
| "feature_blocks": len(feature_manifest), | |
| "warning": walkthroughs.get("scope", {}).get("warning"), | |
| }, | |
| "baseline_summary": { | |
| "task_count": len(tasks), | |
| "baseline_heads": "minimal and neural MLP heads", | |
| "split": "chronological single-episode split for public-sample diagnostics", | |
| "current_use": "task design, data-contract validation, case studies, and baseline comparison", | |
| }, | |
| "scale_up": { | |
| "target_episodes": omni.get("target_episodes"), | |
| "candidate_scan_top_level_sessions": omni.get("candidate_scan_top_level_sessions"), | |
| "valid_candidates": omni.get("valid_candidates"), | |
| "estimated_bytes": omni.get("estimated_bytes"), | |
| "status": omni.get("status"), | |
| "access_status": omni.get("access_status"), | |
| "exclude": omni.get("exclude", []), | |
| "selection_strategy": omni.get("selection_strategy"), | |
| }, | |
| "omni_plan": { | |
| "backbone": "Qwen/Qwen3-Omni-30B-A3B-Instruct", | |
| "adapter": "LoRA rank 16, alpha 32, dropout 0.05", | |
| "first_pilot": "32 held-out-episode pilot after valid episodes are prepared", | |
| "training_unit": "episode-level split, window-level supervised examples", | |
| "evaluation": [ | |
| "JSON validity", | |
| "action macro-F1", | |
| "subtask accuracy", | |
| "transition accuracy", | |
| "next-action accuracy", | |
| "contact accuracy", | |
| "object micro-F1", | |
| "held-out episode count", | |
| ], | |
| }, | |
| "foundation_model_plan": { | |
| "status": foundation_plan.get("status"), | |
| "decision": foundation_plan.get("decision", {}), | |
| "model_families": foundation_plan.get("model_families", []), | |
| "execution_order": foundation_plan.get("execution_order", []), | |
| "evaluation_additions": foundation_plan.get("evaluation_additions", []), | |
| "source_links": foundation_plan.get("source_links", []), | |
| }, | |
| "additional_development_directions": { | |
| "title": additional_directions.get("title"), | |
| "summary": additional_directions.get("summary"), | |
| "status": additional_directions.get("status"), | |
| "public_boundary": additional_directions.get("public_boundary"), | |
| "directions": additional_directions.get("directions", []), | |
| "practical_order": additional_directions.get("practical_order", []), | |
| "source_document": additional_directions.get("source_document"), | |
| }, | |
| "phases": phase_payload(roadmap.get("phases", [])), | |
| "directions": directions, | |
| "tasks": list(tasks.values()), | |
| } | |
| out_path = DOCS_DATA / "research_roadmap_interactive.json" | |
| out_path.write_text(json.dumps(payload, indent=2, sort_keys=True) + "\n", encoding="utf-8") | |
| print(f"Wrote {out_path}") | |
| return 0 | |
| if __name__ == "__main__": | |
| raise SystemExit(main()) | |