Robotics
PyTorch
Cosmos
xperience10m_task_baseline_suite
embodied-ai
multimodal
xperience-10m
baseline
evaluation
qwen3-omni
Instructions to use cy0307/ropedia-xperience-10m-task-baselines with libraries, inference providers, notebooks, and local apps. Follow these links to get started.
- Libraries
- Cosmos
How to use cy0307/ropedia-xperience-10m-task-baselines with Cosmos:
# No code snippets available yet for this library. # To use this model, check the repository files and the library's documentation. # Want to help? PRs adding snippets are welcome at: # https://github.com/huggingface/huggingface.js
- Notebooks
- Google Colab
- Kaggle
File size: 4,872 Bytes
0149130 | 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 | {
"schema": "ropedia.task_icons.v1",
"description": "Assigned icon assets for the unified 20-task Xperience-10M suite.",
"overall_sheet": "assets/task-icons/task-icon-atlas.png",
"tasks": [
{
"task_id": "timeline_action",
"task_number": 1,
"display_name": "Action Recognition",
"motif": "person action pose",
"icon": "assets/task-icons/01_timeline_action.svg"
},
{
"task_id": "timeline_subtask",
"task_number": 2,
"display_name": "Procedure Step Recognition",
"motif": "ordered step checklist",
"icon": "assets/task-icons/02_timeline_subtask.svg"
},
{
"task_id": "transition_detection",
"task_number": 3,
"display_name": "Action Boundary Detection",
"motif": "timeline boundary",
"icon": "assets/task-icons/03_transition_detection.svg"
},
{
"task_id": "next_action",
"task_number": 4,
"display_name": "Next-Action Prediction",
"motif": "next action arrow",
"icon": "assets/task-icons/04_next_action.svg"
},
{
"task_id": "hand_trajectory_forecast",
"task_number": 5,
"display_name": "Hand Trajectory Forecasting",
"motif": "future hand path",
"icon": "assets/task-icons/05_hand_trajectory_forecast.svg"
},
{
"task_id": "contact_prediction",
"task_number": 6,
"display_name": "Contact State Prediction",
"motif": "touch contact point",
"icon": "assets/task-icons/06_contact_prediction.svg"
},
{
"task_id": "object_relevance",
"task_number": 7,
"display_name": "Object Relevance Prediction",
"motif": "highlighted relevant object",
"icon": "assets/task-icons/07_object_relevance.svg"
},
{
"task_id": "caption_grounding",
"task_number": 8,
"display_name": "Language Grounding",
"motif": "caption grounded to frame",
"icon": "assets/task-icons/08_caption_grounding.svg"
},
{
"task_id": "cross_modal_retrieval",
"task_number": 9,
"display_name": "Cross-Modal Retrieval",
"motif": "search across modalities",
"icon": "assets/task-icons/09_cross_modal_retrieval.svg"
},
{
"task_id": "modality_reconstruction",
"task_number": 10,
"display_name": "Cross-Modal Reconstruction",
"motif": "missing modality rebuilt",
"icon": "assets/task-icons/10_modality_reconstruction.svg"
},
{
"task_id": "temporal_order",
"task_number": 11,
"display_name": "Temporal Order Verification",
"motif": "ordered event nodes",
"icon": "assets/task-icons/11_temporal_order.svg"
},
{
"task_id": "misalignment_detection",
"task_number": 12,
"display_name": "Multimodal Synchronization Detection",
"motif": "sync mismatch warning",
"icon": "assets/task-icons/12_misalignment_detection.svg"
},
{
"task_id": "long_horizon_next_action",
"task_number": 13,
"display_name": "Long-Horizon Next-Action Forecasting",
"motif": "long future action path",
"icon": "assets/task-icons/13_long_horizon_next_action.svg"
},
{
"task_id": "next_subtask_forecast",
"task_number": 14,
"display_name": "Long-Horizon Next-Subtask Forecasting",
"motif": "future step branch",
"icon": "assets/task-icons/14_next_subtask_forecast.svg"
},
{
"task_id": "interaction_text_prediction",
"task_number": 15,
"display_name": "Interaction Text Prediction",
"motif": "hand action to text",
"icon": "assets/task-icons/15_interaction_text_prediction.svg"
},
{
"task_id": "action_object_relation",
"task_number": 16,
"display_name": "Action-Object Relation Prediction",
"motif": "hand object relation graph",
"icon": "assets/task-icons/16_action_object_relation.svg"
},
{
"task_id": "object_set_forecast",
"task_number": 17,
"display_name": "Future Object-Set Forecasting",
"motif": "future object cluster",
"icon": "assets/task-icons/17_object_set_forecast.svg"
},
{
"task_id": "imu_to_hand_pose",
"task_number": 18,
"display_name": "IMU-to-Hand Pose Reconstruction",
"motif": "imu waveform to hand pose",
"icon": "assets/task-icons/18_imu_to_hand_pose.svg"
},
{
"task_id": "camera_view_sync_retrieval",
"task_number": 19,
"display_name": "Camera-View Synchronization Retrieval",
"motif": "multi-camera sync",
"icon": "assets/task-icons/19_camera_view_sync_retrieval.svg"
},
{
"task_id": "time_to_transition",
"task_number": 20,
"display_name": "Time-to-Next-Transition Regression",
"motif": "clock to transition",
"icon": "assets/task-icons/20_time_to_transition.svg"
}
]
}
|