| {"id": "xperience-10m-sample:qa:0", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 0, "end_frame": 19, "num_frames": 20}, "true_label": "Pick up kettle", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": \"unknown\",\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"0-19\"\n}\n```", "true_json": {"action": "Pick up kettle", "subtask": "Pick up and position kettle", "objects": ["kettle", "coffee dripper", "scale", "bottle"], "contact": "yes", "transition": "no", "next_action": "Pick up kettle", "evidence_window": {"start_frame": 0, "end_frame": 19}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": "unknown", "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "0-19"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:1", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 20, "end_frame": 39, "num_frames": 20}, "true_label": "Pick up kettle", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": \"unknown\",\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"unknown\"\n}\n```", "true_json": {"action": "Pick up kettle", "subtask": "Pick up and position kettle", "objects": ["kettle", "coffee dripper", "scale", "bottle"], "contact": "yes", "transition": "no", "next_action": "Pick up kettle", "evidence_window": {"start_frame": 20, "end_frame": 39}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": "unknown", "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "unknown"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:2", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 40, "end_frame": 59, "num_frames": 20}, "true_label": "Pick up kettle", "raw_prediction": "```json\n{\n \"action\": \"Wait/Prepare for pouring\",\n \"subtask\": \"Prepare for pouring\",\n \"objects\": [],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"Pour coffee\",\n \"evidence_window\": \"40-59\"\n}\n```", "true_json": {"action": "Pick up kettle", "subtask": "Pick up and position kettle", "objects": ["kettle", "coffee dripper", "scale", "bottle"], "contact": "yes", "transition": "no", "next_action": "Pick up kettle", "evidence_window": {"start_frame": 40, "end_frame": 59}}, "pred_json": {"action": "Wait/Prepare for pouring", "subtask": "Prepare for pouring", "objects": [], "contact": "unknown", "transition": "unknown", "next_action": "Pour coffee", "evidence_window": "40-59"}, "predicted_label": "Wait/Prepare for pouring", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:3", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 60, "end_frame": 79, "num_frames": 20}, "true_label": "Pick up kettle", "raw_prediction": "```json\n{\n \"action\": \"Wait/Prepare for pouring\",\n \"subtask\": \"Prepare for pouring\",\n \"objects\": [\n \"gooseneck kettle\"\n ],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"Pour coffee\",\n \"evidence_window\": \"60-79\"\n}\n```", "true_json": {"action": "Pick up kettle", "subtask": "Pick up and position kettle", "objects": ["kettle", "coffee dripper", "scale", "bottle"], "contact": "yes", "transition": "no", "next_action": "Pick up kettle", "evidence_window": {"start_frame": 60, "end_frame": 79}}, "pred_json": {"action": "Wait/Prepare for pouring", "subtask": "Prepare for pouring", "objects": ["gooseneck kettle"], "contact": "unknown", "transition": "unknown", "next_action": "Pour coffee", "evidence_window": "60-79"}, "predicted_label": "Wait/Prepare for pouring", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:4", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 80, "end_frame": 99, "num_frames": 20}, "true_label": "Pick up kettle", "raw_prediction": "```json\n{\n \"action\": \"Wait/Prepare for pouring\",\n \"subtask\": \"Prepare for pouring\",\n \"objects\": [\n \"gooseneck kettle\"\n ],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"Pour coffee\",\n \"evidence_window\": \"80-99\"\n}\n```", "true_json": {"action": "Pick up kettle", "subtask": "Pick up and position kettle", "objects": ["kettle", "coffee dripper", "scale", "bottle"], "contact": "yes", "transition": "no", "next_action": "Pick up kettle", "evidence_window": {"start_frame": 80, "end_frame": 99}}, "pred_json": {"action": "Wait/Prepare for pouring", "subtask": "Prepare for pouring", "objects": ["gooseneck kettle"], "contact": "unknown", "transition": "unknown", "next_action": "Pour coffee", "evidence_window": "80-99"}, "predicted_label": "Wait/Prepare for pouring", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:5", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 100, "end_frame": 119, "num_frames": 20}, "true_label": "Pick up kettle", "raw_prediction": "```json\n{\n \"action\": \"Wait/Prepare for pouring\",\n \"subtask\": \"Prepare for pouring\",\n \"objects\": [],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"Pour coffee\",\n \"evidence_window\": \"100-119\"\n}\n```", "true_json": {"action": "Pick up kettle", "subtask": "Pick up and position kettle", "objects": ["kettle", "coffee dripper", "scale", "bottle"], "contact": "yes", "transition": "no", "next_action": "Pick up kettle", "evidence_window": {"start_frame": 100, "end_frame": 119}}, "pred_json": {"action": "Wait/Prepare for pouring", "subtask": "Prepare for pouring", "objects": [], "contact": "unknown", "transition": "unknown", "next_action": "Pour coffee", "evidence_window": "100-119"}, "predicted_label": "Wait/Prepare for pouring", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:6", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 120, "end_frame": 139, "num_frames": 20}, "true_label": "Pick up kettle", "raw_prediction": "```json\n{\n \"action\": \"Wait/Prepare for pouring\",\n \"subtask\": \"Prepare for pouring\",\n \"objects\": [\n \"gooseneck kettle\"\n ],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"Pour coffee\",\n \"evidence_window\": \"120-139\"\n}\n```", "true_json": {"action": "Pick up kettle", "subtask": "Pick up and position kettle", "objects": ["kettle"], "contact": "yes", "transition": "no", "next_action": "Pick up kettle", "evidence_window": {"start_frame": 120, "end_frame": 139}}, "pred_json": {"action": "Wait/Prepare for pouring", "subtask": "Prepare for pouring", "objects": ["gooseneck kettle"], "contact": "unknown", "transition": "unknown", "next_action": "Pour coffee", "evidence_window": "120-139"}, "predicted_label": "Wait/Prepare for pouring", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:7", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 140, "end_frame": 159, "num_frames": 20}, "true_label": "Pick up kettle", "raw_prediction": "```json\n{\n \"action\": \"Wait/Prepare for pouring\",\n \"subtask\": \"Prepare for pouring\",\n \"objects\": [\n \"gooseneck kettle\"\n ],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"Pour coffee\",\n \"evidence_window\": \"140-159\"\n}\n```", "true_json": {"action": "Pick up kettle", "subtask": "Pick up and position kettle", "objects": ["kettle"], "contact": "yes", "transition": "no", "next_action": "Position kettle to pour", "evidence_window": {"start_frame": 140, "end_frame": 159}}, "pred_json": {"action": "Wait/Prepare for pouring", "subtask": "Prepare for pouring", "objects": ["gooseneck kettle"], "contact": "unknown", "transition": "unknown", "next_action": "Pour coffee", "evidence_window": "140-159"}, "predicted_label": "Wait/Prepare for pouring", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:8", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 160, "end_frame": 179, "num_frames": 20}, "true_label": "Position kettle to pour", "raw_prediction": "```json\n{\n \"action\": \"Wait/Prepare for pouring\",\n \"subtask\": \"Prepare for pouring\",\n \"objects\": [\n \"gooseneck kettle\"\n ],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"Pour coffee\",\n \"evidence_window\": \"160-179\"\n}\n```", "true_json": {"action": "Position kettle to pour", "subtask": "Pick up and position kettle", "objects": ["kettle"], "contact": "yes", "transition": "no", "next_action": "Position kettle to pour", "evidence_window": {"start_frame": 160, "end_frame": 179}}, "pred_json": {"action": "Wait/Prepare for pouring", "subtask": "Prepare for pouring", "objects": ["gooseneck kettle"], "contact": "unknown", "transition": "unknown", "next_action": "Pour coffee", "evidence_window": "160-179"}, "predicted_label": "Wait/Prepare for pouring", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:9", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 180, "end_frame": 199, "num_frames": 20}, "true_label": "Position kettle to pour", "raw_prediction": "```json\n{\n \"action\": \"Wait/Prepare for pouring\",\n \"subtask\": \"Prepare for pouring\",\n \"objects\": [\n \"gooseneck kettle\"\n ],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"Pour coffee\",\n \"evidence_window\": \"180-199\"\n}\n```", "true_json": {"action": "Position kettle to pour", "subtask": "Pick up and position kettle", "objects": ["kettle"], "contact": "yes", "transition": "no", "next_action": "Position kettle to pour", "evidence_window": {"start_frame": 180, "end_frame": 199}}, "pred_json": {"action": "Wait/Prepare for pouring", "subtask": "Prepare for pouring", "objects": ["gooseneck kettle"], "contact": "unknown", "transition": "unknown", "next_action": "Pour coffee", "evidence_window": "180-199"}, "predicted_label": "Wait/Prepare for pouring", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:10", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 200, "end_frame": 219, "num_frames": 20}, "true_label": "Position kettle to pour", "raw_prediction": "```json\n{\n \"action\": \"Wait/Prepare for pouring\",\n \"subtask\": \"Prepare for pouring\",\n \"objects\": [\n \"gooseneck kettle\"\n ],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"Pour coffee\",\n \"evidence_window\": \"200-219\"\n}\n```", "true_json": {"action": "Position kettle to pour", "subtask": "Pick up and position kettle", "objects": ["kettle"], "contact": "yes", "transition": "no", "next_action": "Position kettle to pour", "evidence_window": {"start_frame": 200, "end_frame": 219}}, "pred_json": {"action": "Wait/Prepare for pouring", "subtask": "Prepare for pouring", "objects": ["gooseneck kettle"], "contact": "unknown", "transition": "unknown", "next_action": "Pour coffee", "evidence_window": "200-219"}, "predicted_label": "Wait/Prepare for pouring", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:11", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 220, "end_frame": 239, "num_frames": 20}, "true_label": "Position kettle to pour", "raw_prediction": "```json\n{\n \"action\": \"Wait/Prepare for pouring\",\n \"subtask\": \"Prepare for pouring\",\n \"objects\": [\n \"gooseneck kettle\"\n ],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"Pour coffee\",\n \"evidence_window\": \"220-239\"\n}\n```", "true_json": {"action": "Position kettle to pour", "subtask": "Pick up and position kettle", "objects": ["kettle"], "contact": "yes", "transition": "no", "next_action": "Position kettle to pour", "evidence_window": {"start_frame": 220, "end_frame": 239}}, "pred_json": {"action": "Wait/Prepare for pouring", "subtask": "Prepare for pouring", "objects": ["gooseneck kettle"], "contact": "unknown", "transition": "unknown", "next_action": "Pour coffee", "evidence_window": "220-239"}, "predicted_label": "Wait/Prepare for pouring", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:12", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 240, "end_frame": 259, "num_frames": 20}, "true_label": "Position kettle to pour", "raw_prediction": "```json\n{\n \"action\": \"Wait/Prepare for pouring\",\n \"subtask\": \"Prepare for pouring\",\n \"objects\": [\n \"gooseneck kettle\"\n ],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"Pour coffee\",\n \"evidence_window\": \"240-259\"\n}\n```", "true_json": {"action": "Position kettle to pour", "subtask": "Pick up and position kettle", "objects": ["kettle"], "contact": "yes", "transition": "no", "next_action": "Position kettle to pour", "evidence_window": {"start_frame": 240, "end_frame": 259}}, "pred_json": {"action": "Wait/Prepare for pouring", "subtask": "Prepare for pouring", "objects": ["gooseneck kettle"], "contact": "unknown", "transition": "unknown", "next_action": "Pour coffee", "evidence_window": "240-259"}, "predicted_label": "Wait/Prepare for pouring", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:13", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 260, "end_frame": 279, "num_frames": 20}, "true_label": "Position kettle to pour", "raw_prediction": "```json\n{\n \"action\": \"Wait/Prepare for pouring\",\n \"subtask\": \"Prepare for pouring\",\n \"objects\": [\n \"gooseneck kettle\"\n ],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"Pour coffee\",\n \"evidence_window\": \"260-279\"\n}\n```", "true_json": {"action": "Position kettle to pour", "subtask": "Pick up and position kettle", "objects": ["kettle"], "contact": "yes", "transition": "no", "next_action": "Position kettle to pour", "evidence_window": {"start_frame": 260, "end_frame": 279}}, "pred_json": {"action": "Wait/Prepare for pouring", "subtask": "Prepare for pouring", "objects": ["gooseneck kettle"], "contact": "unknown", "transition": "unknown", "next_action": "Pour coffee", "evidence_window": "260-279"}, "predicted_label": "Wait/Prepare for pouring", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:14", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 280, "end_frame": 299, "num_frames": 20}, "true_label": "Position kettle to pour", "raw_prediction": "```json\n{\n \"action\": \"Wait/Prepare for pouring\",\n \"subtask\": \"Prepare for pouring\",\n \"objects\": [\n \"gooseneck kettle\"\n ],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"Pour coffee\",\n \"evidence_window\": \"280-299\"\n}\n```", "true_json": {"action": "Position kettle to pour", "subtask": "Pick up and position kettle", "objects": ["kettle"], "contact": "yes", "transition": "no", "next_action": "Position kettle to pour", "evidence_window": {"start_frame": 280, "end_frame": 299}}, "pred_json": {"action": "Wait/Prepare for pouring", "subtask": "Prepare for pouring", "objects": ["gooseneck kettle"], "contact": "unknown", "transition": "unknown", "next_action": "Pour coffee", "evidence_window": "280-299"}, "predicted_label": "Wait/Prepare for pouring", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:15", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 300, "end_frame": 319, "num_frames": 20}, "true_label": "Position kettle to pour", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": \"unknown\",\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"unknown\"\n}\n```", "true_json": {"action": "Position kettle to pour", "subtask": "Pick up and position kettle", "objects": ["kettle"], "contact": "yes", "transition": "no", "next_action": "Position kettle to pour", "evidence_window": {"start_frame": 300, "end_frame": 319}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": "unknown", "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "unknown"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:40", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 800, "end_frame": 819, "num_frames": 20}, "true_label": "Move kettle", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": \"unknown\",\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"800-819\"\n}\n```", "true_json": {"action": "Move kettle", "subtask": "Move kettle", "objects": ["kettle", "dripper", "scale", "coffee filter", "table"], "contact": "yes", "transition": "no", "next_action": "Move kettle", "evidence_window": {"start_frame": 800, "end_frame": 819}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": "unknown", "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "800-819"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:41", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 820, "end_frame": 839, "num_frames": 20}, "true_label": "Move kettle", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": \"unknown\",\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"820-839\"\n}\n```", "true_json": {"action": "Move kettle", "subtask": "Move kettle", "objects": ["kettle", "dripper", "scale", "coffee filter", "table"], "contact": "yes", "transition": "no", "next_action": "Move kettle", "evidence_window": {"start_frame": 820, "end_frame": 839}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": "unknown", "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "820-839"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:42", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 840, "end_frame": 859, "num_frames": 20}, "true_label": "Move kettle", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": \"unknown\",\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"unknown\"\n}\n```", "true_json": {"action": "Move kettle", "subtask": "Move kettle", "objects": ["kettle", "dripper", "scale", "coffee filter", "table"], "contact": "yes", "transition": "no", "next_action": "Move kettle", "evidence_window": {"start_frame": 840, "end_frame": 859}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": "unknown", "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "unknown"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:43", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 860, "end_frame": 879, "num_frames": 20}, "true_label": "Move kettle", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": [\n \"gooseneck kettle\",\n \"white bottle\"\n ],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"unknown\"\n}\n```", "true_json": {"action": "Move kettle", "subtask": "Move kettle", "objects": ["kettle", "dripper", "scale", "coffee filter", "table"], "contact": "yes", "transition": "no", "next_action": "Move kettle", "evidence_window": {"start_frame": 860, "end_frame": 879}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": ["gooseneck kettle", "white bottle"], "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "unknown"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:44", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 880, "end_frame": 899, "num_frames": 20}, "true_label": "Move kettle", "raw_prediction": "```json\n{\n \"action\": \"Wait/Prepare for pouring\",\n \"subtask\": \"Prepare for pouring\",\n \"objects\": [\n \"gooseneck kettle\"\n ],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"Pour coffee\",\n \"evidence_window\": \"880-899\"\n}\n```", "true_json": {"action": "Move kettle", "subtask": "Move kettle", "objects": ["kettle", "dripper", "scale", "coffee filter", "table"], "contact": "yes", "transition": "no", "next_action": "Move kettle", "evidence_window": {"start_frame": 880, "end_frame": 899}}, "pred_json": {"action": "Wait/Prepare for pouring", "subtask": "Prepare for pouring", "objects": ["gooseneck kettle"], "contact": "unknown", "transition": "unknown", "next_action": "Pour coffee", "evidence_window": "880-899"}, "predicted_label": "Wait/Prepare for pouring", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:45", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 900, "end_frame": 919, "num_frames": 20}, "true_label": "Move kettle", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": [\n \"gooseneck kettle\",\n \"white bottle\"\n ],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"900-919\"\n}\n```", "true_json": {"action": "Move kettle", "subtask": "Move kettle", "objects": ["kettle", "dripper", "scale", "coffee filter", "table"], "contact": "yes", "transition": "no", "next_action": "Move kettle", "evidence_window": {"start_frame": 900, "end_frame": 919}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": ["gooseneck kettle", "white bottle"], "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "900-919"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:46", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 920, "end_frame": 939, "num_frames": 20}, "true_label": "Move kettle", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": [],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"920-939\"\n}\n```", "true_json": {"action": "Move kettle", "subtask": "Move kettle", "objects": ["kettle", "dripper", "scale", "coffee filter", "table"], "contact": "yes", "transition": "no", "next_action": "Move kettle", "evidence_window": {"start_frame": 920, "end_frame": 939}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": [], "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "920-939"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:47", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 940, "end_frame": 959, "num_frames": 20}, "true_label": "Move kettle", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": \"unknown\",\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"940-959\"\n}\n```", "true_json": {"action": "Move kettle", "subtask": "Move kettle", "objects": ["kettle", "dripper", "scale", "coffee filter", "table"], "contact": "yes", "transition": "no", "next_action": "Move kettle", "evidence_window": {"start_frame": 940, "end_frame": 959}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": "unknown", "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "940-959"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:50", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 1000, "end_frame": 1019, "num_frames": 20}, "true_label": "Hold coffee carafe", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": [],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"1000-1019\"\n}\n```", "true_json": {"action": "Hold coffee carafe", "subtask": "Prepare coffee equipment and scoop grounds", "objects": ["glass carafe", "coffee scale", "coffee dripper", "white mug", "bottle"], "contact": "yes", "transition": "no", "next_action": "Hold coffee carafe", "evidence_window": {"start_frame": 1000, "end_frame": 1019}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": [], "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "1000-1019"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:51", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 1020, "end_frame": 1039, "num_frames": 20}, "true_label": "Hold coffee carafe", "raw_prediction": "```json\n{\n \"action\": \"Wait/Prepare for pouring\",\n \"subtask\": \"Prepare for pouring\",\n \"objects\": [\n \"gooseneck kettle\"\n ],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"Pour coffee\",\n \"evidence_window\": \"1020-1039\"\n}\n```", "true_json": {"action": "Hold coffee carafe", "subtask": "Prepare coffee equipment and scoop grounds", "objects": ["glass carafe", "coffee scale", "coffee dripper", "white mug", "bottle"], "contact": "yes", "transition": "no", "next_action": "Hold coffee carafe", "evidence_window": {"start_frame": 1020, "end_frame": 1039}}, "pred_json": {"action": "Wait/Prepare for pouring", "subtask": "Prepare for pouring", "objects": ["gooseneck kettle"], "contact": "unknown", "transition": "unknown", "next_action": "Pour coffee", "evidence_window": "1020-1039"}, "predicted_label": "Wait/Prepare for pouring", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:52", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 1040, "end_frame": 1059, "num_frames": 20}, "true_label": "Hold coffee carafe", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": [\n \"gooseneck kettle\",\n \"white bottle\"\n ],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"unknown\"\n}\n```", "true_json": {"action": "Hold coffee carafe", "subtask": "Prepare coffee equipment and scoop grounds", "objects": ["glass carafe", "coffee scale", "coffee dripper", "white mug", "bottle"], "contact": "yes", "transition": "no", "next_action": "Hold coffee carafe", "evidence_window": {"start_frame": 1040, "end_frame": 1059}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": ["gooseneck kettle", "white bottle"], "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "unknown"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:53", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 1060, "end_frame": 1079, "num_frames": 20}, "true_label": "Hold coffee carafe", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": \"unknown\",\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"1060-1079\"\n}\n```", "true_json": {"action": "Hold coffee carafe", "subtask": "Prepare coffee equipment and scoop grounds", "objects": ["glass carafe", "coffee scale", "coffee dripper", "white mug", "bottle"], "contact": "yes", "transition": "no", "next_action": "Hold coffee carafe", "evidence_window": {"start_frame": 1060, "end_frame": 1079}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": "unknown", "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "1060-1079"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:54", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 1080, "end_frame": 1099, "num_frames": 20}, "true_label": "Hold coffee carafe", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": [],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"1080-1099\"\n}\n```", "true_json": {"action": "Hold coffee carafe", "subtask": "Prepare coffee equipment and scoop grounds", "objects": ["glass carafe", "coffee scale", "coffee dripper", "white mug", "bottle"], "contact": "yes", "transition": "no", "next_action": "Hold coffee carafe", "evidence_window": {"start_frame": 1080, "end_frame": 1099}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": [], "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "1080-1099"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:55", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 1100, "end_frame": 1119, "num_frames": 20}, "true_label": "Hold coffee carafe", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": \"unknown\",\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"1100-1119\"\n}\n```", "true_json": {"action": "Hold coffee carafe", "subtask": "Prepare coffee equipment and scoop grounds", "objects": ["glass carafe", "coffee scale", "coffee dripper", "white mug", "bottle"], "contact": "yes", "transition": "no", "next_action": "Hold coffee carafe", "evidence_window": {"start_frame": 1100, "end_frame": 1119}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": "unknown", "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "1100-1119"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:56", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 1120, "end_frame": 1139, "num_frames": 20}, "true_label": "Hold coffee carafe", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": \"unknown\",\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"1120-1139\"\n}\n```", "true_json": {"action": "Hold coffee carafe", "subtask": "Prepare coffee equipment and scoop grounds", "objects": ["glass carafe", "coffee scale", "coffee dripper", "white mug", "bottle"], "contact": "yes", "transition": "no", "next_action": "Hold coffee carafe", "evidence_window": {"start_frame": 1120, "end_frame": 1139}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": "unknown", "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "1120-1139"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:57", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 1140, "end_frame": 1159, "num_frames": 20}, "true_label": "Hold coffee carafe", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": [],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"1140-1159\"\n}\n```", "true_json": {"action": "Hold coffee carafe", "subtask": "Prepare coffee equipment and scoop grounds", "objects": ["glass carafe", "coffee scale", "coffee dripper", "white mug", "bottle"], "contact": "yes", "transition": "no", "next_action": "Hold coffee carafe", "evidence_window": {"start_frame": 1140, "end_frame": 1159}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": [], "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "1140-1159"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:62", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 1240, "end_frame": 1259, "num_frames": 20}, "true_label": "Grasp coffee scoop", "raw_prediction": "```json\n{\n \"action\": \"Wait/Prepare for pouring\",\n \"subtask\": \"Prepare for pouring\",\n \"objects\": [\"gooseneck kettle\"],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"Pour coffee\",\n \"evidence_window\": \"1240-1259\"\n}\n```", "true_json": {"action": "Grasp coffee scoop", "subtask": "Prepare coffee equipment and scoop grounds", "objects": ["glass carafe", "wooden scoop"], "contact": "yes", "transition": "no", "next_action": "Grasp coffee scoop", "evidence_window": {"start_frame": 1240, "end_frame": 1259}}, "pred_json": {"action": "Wait/Prepare for pouring", "subtask": "Prepare for pouring", "objects": ["gooseneck kettle"], "contact": "unknown", "transition": "unknown", "next_action": "Pour coffee", "evidence_window": "1240-1259"}, "predicted_label": "Wait/Prepare for pouring", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:63", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 1260, "end_frame": 1279, "num_frames": 20}, "true_label": "Grasp coffee scoop", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": [\n \"gooseneck kettle\",\n \"white bottle\"\n ],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"1260-1279\"\n}\n```", "true_json": {"action": "Grasp coffee scoop", "subtask": "Prepare coffee equipment and scoop grounds", "objects": ["glass carafe", "wooden scoop"], "contact": "yes", "transition": "no", "next_action": "Grasp coffee scoop", "evidence_window": {"start_frame": 1260, "end_frame": 1279}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": ["gooseneck kettle", "white bottle"], "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "1260-1279"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:64", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 1280, "end_frame": 1299, "num_frames": 20}, "true_label": "Grasp coffee scoop", "raw_prediction": "```json\n{\n \"action\": \"Wait/Prepare for pouring\",\n \"subtask\": \"Prepare for pouring\",\n \"objects\": [\n \"gooseneck kettle\"\n ],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"Pour coffee\",\n \"evidence_window\": \"1280-1299\"\n}\n```", "true_json": {"action": "Grasp coffee scoop", "subtask": "Prepare coffee equipment and scoop grounds", "objects": ["glass carafe", "wooden scoop"], "contact": "yes", "transition": "no", "next_action": "Grasp coffee scoop", "evidence_window": {"start_frame": 1280, "end_frame": 1299}}, "pred_json": {"action": "Wait/Prepare for pouring", "subtask": "Prepare for pouring", "objects": ["gooseneck kettle"], "contact": "unknown", "transition": "unknown", "next_action": "Pour coffee", "evidence_window": "1280-1299"}, "predicted_label": "Wait/Prepare for pouring", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:65", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 1300, "end_frame": 1319, "num_frames": 20}, "true_label": "Grasp coffee scoop", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": \"unknown\",\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"1300-1319\"\n}\n```", "true_json": {"action": "Grasp coffee scoop", "subtask": "Prepare coffee equipment and scoop grounds", "objects": ["glass carafe", "wooden scoop"], "contact": "yes", "transition": "no", "next_action": "Grasp coffee scoop", "evidence_window": {"start_frame": 1300, "end_frame": 1319}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": "unknown", "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "1300-1319"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:66", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 1320, "end_frame": 1339, "num_frames": 20}, "true_label": "Grasp coffee scoop", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": [\n \"white bottle\"\n ],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"unknown\"\n}\n```", "true_json": {"action": "Grasp coffee scoop", "subtask": "Prepare coffee equipment and scoop grounds", "objects": ["glass carafe", "wooden scoop"], "contact": "yes", "transition": "no", "next_action": "Grasp coffee scoop", "evidence_window": {"start_frame": 1320, "end_frame": 1339}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": ["white bottle"], "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "unknown"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:67", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 1340, "end_frame": 1359, "num_frames": 20}, "true_label": "Grasp coffee scoop", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": [],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"1340-1359\"\n}\n```", "true_json": {"action": "Grasp coffee scoop", "subtask": "Prepare coffee equipment and scoop grounds", "objects": ["glass carafe", "wooden scoop"], "contact": "yes", "transition": "no", "next_action": "Grasp coffee scoop", "evidence_window": {"start_frame": 1340, "end_frame": 1359}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": [], "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "1340-1359"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:68", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 1360, "end_frame": 1379, "num_frames": 20}, "true_label": "Grasp coffee scoop", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": [\n \"white bottle\"\n ],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"1360-1379\"\n}\n```", "true_json": {"action": "Grasp coffee scoop", "subtask": "Prepare coffee equipment and scoop grounds", "objects": ["glass carafe", "wooden scoop"], "contact": "yes", "transition": "no", "next_action": "Grasp coffee scoop", "evidence_window": {"start_frame": 1360, "end_frame": 1379}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": ["white bottle"], "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "1360-1379"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:69", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 1380, "end_frame": 1399, "num_frames": 20}, "true_label": "Grasp coffee scoop", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": \"unknown\",\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"1380-1399\"\n}\n```", "true_json": {"action": "Grasp coffee scoop", "subtask": "Prepare coffee equipment and scoop grounds", "objects": ["glass carafe", "wooden scoop"], "contact": "yes", "transition": "no", "next_action": "Grasp coffee scoop", "evidence_window": {"start_frame": 1380, "end_frame": 1399}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": "unknown", "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "1380-1399"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:78", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 1560, "end_frame": 1579, "num_frames": 20}, "true_label": "Transfer coffee to dripper", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": [],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"1560-1579\"\n}\n```", "true_json": {"action": "Transfer coffee to dripper", "subtask": "Transfer coffee grounds to dripper", "objects": ["coffee jar", "coffee scoop"], "contact": "yes", "transition": "yes", "next_action": "Transfer coffee to dripper", "evidence_window": {"start_frame": 1560, "end_frame": 1579}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": [], "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "1560-1579"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:79", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 1580, "end_frame": 1599, "num_frames": 20}, "true_label": "Transfer coffee to dripper", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": [],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"1580-1599\"\n}\n```", "true_json": {"action": "Transfer coffee to dripper", "subtask": "Transfer coffee grounds to dripper", "objects": ["coffee jar", "coffee scoop"], "contact": "yes", "transition": "no", "next_action": "Transfer coffee to dripper", "evidence_window": {"start_frame": 1580, "end_frame": 1599}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": [], "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "1580-1599"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:80", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 1600, "end_frame": 1619, "num_frames": 20}, "true_label": "Transfer coffee to dripper", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": \"unknown\",\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"1600-1619\"\n}\n```", "true_json": {"action": "Transfer coffee to dripper", "subtask": "Transfer coffee grounds to dripper", "objects": ["coffee scoop", "dripper"], "contact": "yes", "transition": "no", "next_action": "Transfer coffee to dripper", "evidence_window": {"start_frame": 1600, "end_frame": 1619}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": "unknown", "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "1600-1619"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:81", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 1620, "end_frame": 1639, "num_frames": 20}, "true_label": "Transfer coffee to dripper", "raw_prediction": "```json\n{\n \"action\": \"Wait/Prepare for pouring\",\n \"subtask\": \"Prepare for pouring\",\n \"objects\": [\n \"gooseneck kettle\"\n ],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"Pour coffee\",\n \"evidence_window\": \"1620-1639\"\n}\n```", "true_json": {"action": "Transfer coffee to dripper", "subtask": "Transfer coffee grounds to dripper", "objects": ["coffee scoop", "dripper"], "contact": "yes", "transition": "no", "next_action": "Transfer coffee to dripper", "evidence_window": {"start_frame": 1620, "end_frame": 1639}}, "pred_json": {"action": "Wait/Prepare for pouring", "subtask": "Prepare for pouring", "objects": ["gooseneck kettle"], "contact": "unknown", "transition": "unknown", "next_action": "Pour coffee", "evidence_window": "1620-1639"}, "predicted_label": "Wait/Prepare for pouring", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:82", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 1640, "end_frame": 1659, "num_frames": 20}, "true_label": "Transfer coffee to dripper", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": [],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"1640-1659\"\n}\n```", "true_json": {"action": "Transfer coffee to dripper", "subtask": "Transfer coffee grounds to dripper", "objects": ["coffee scoop", "dripper"], "contact": "yes", "transition": "no", "next_action": "Transfer coffee to dripper", "evidence_window": {"start_frame": 1640, "end_frame": 1659}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": [], "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "1640-1659"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:83", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 1660, "end_frame": 1679, "num_frames": 20}, "true_label": "Transfer coffee to dripper", "raw_prediction": "```json\n{\n \"action\": \"Wait/Prepare for pouring\",\n \"subtask\": \"Prepare for pouring\",\n \"objects\": [],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"Pour coffee\",\n \"evidence_window\": \"1660-1679\"\n}\n```", "true_json": {"action": "Transfer coffee to dripper", "subtask": "Transfer coffee grounds to dripper", "objects": ["coffee scoop", "dripper"], "contact": "yes", "transition": "no", "next_action": "Transfer coffee to dripper", "evidence_window": {"start_frame": 1660, "end_frame": 1679}}, "pred_json": {"action": "Wait/Prepare for pouring", "subtask": "Prepare for pouring", "objects": [], "contact": "unknown", "transition": "unknown", "next_action": "Pour coffee", "evidence_window": "1660-1679"}, "predicted_label": "Wait/Prepare for pouring", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:84", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 1680, "end_frame": 1699, "num_frames": 20}, "true_label": "Transfer coffee to dripper", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": \"unknown\",\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"1680-1699\"\n}\n```", "true_json": {"action": "Transfer coffee to dripper", "subtask": "Transfer coffee grounds to dripper", "objects": ["coffee scoop", "dripper"], "contact": "yes", "transition": "no", "next_action": "Transfer coffee to dripper", "evidence_window": {"start_frame": 1680, "end_frame": 1699}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": "unknown", "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "1680-1699"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:85", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 1700, "end_frame": 1719, "num_frames": 20}, "true_label": "Transfer coffee to dripper", "raw_prediction": "```json\n{\n \"action\": \"Wait/Prepare for pouring\",\n \"subtask\": \"Prepare for pouring\",\n \"objects\": [\n \"gooseneck kettle\"\n ],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"Pour coffee\",\n \"evidence_window\": \"1700-1719\"\n}\n```", "true_json": {"action": "Transfer coffee to dripper", "subtask": "Transfer coffee grounds to dripper", "objects": ["coffee scoop", "dripper"], "contact": "yes", "transition": "no", "next_action": "Transfer coffee to dripper", "evidence_window": {"start_frame": 1700, "end_frame": 1719}}, "pred_json": {"action": "Wait/Prepare for pouring", "subtask": "Prepare for pouring", "objects": ["gooseneck kettle"], "contact": "unknown", "transition": "unknown", "next_action": "Pour coffee", "evidence_window": "1700-1719"}, "predicted_label": "Wait/Prepare for pouring", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:100", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 2000, "end_frame": 2019, "num_frames": 20}, "true_label": "Hold gooseneck kettle", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": \"unknown\",\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"2000-2019\"\n}\n```", "true_json": {"action": "Hold gooseneck kettle", "subtask": "Handle gooseneck kettle", "objects": ["gooseneck kettle", "coffee dripper", "digital scale", "water bottle", "coffee mug"], "contact": "yes", "transition": "no", "next_action": "Hold gooseneck kettle", "evidence_window": {"start_frame": 2000, "end_frame": 2019}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": "unknown", "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "2000-2019"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:101", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 2020, "end_frame": 2039, "num_frames": 20}, "true_label": "Hold gooseneck kettle", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": \"unknown\",\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"2020-2039\"\n}\n```", "true_json": {"action": "Hold gooseneck kettle", "subtask": "Handle gooseneck kettle", "objects": ["gooseneck kettle", "coffee dripper", "digital scale", "water bottle", "coffee mug"], "contact": "yes", "transition": "no", "next_action": "Hold gooseneck kettle", "evidence_window": {"start_frame": 2020, "end_frame": 2039}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": "unknown", "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "2020-2039"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:102", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 2040, "end_frame": 2059, "num_frames": 20}, "true_label": "Hold gooseneck kettle", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": [],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"2040-2059\"\n}\n```", "true_json": {"action": "Hold gooseneck kettle", "subtask": "Handle gooseneck kettle", "objects": ["gooseneck kettle", "coffee dripper", "digital scale", "water bottle", "coffee mug"], "contact": "yes", "transition": "no", "next_action": "Hold gooseneck kettle", "evidence_window": {"start_frame": 2040, "end_frame": 2059}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": [], "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "2040-2059"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:103", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 2060, "end_frame": 2079, "num_frames": 20}, "true_label": "Hold gooseneck kettle", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": [],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"2060-2079\"\n}\n```", "true_json": {"action": "Hold gooseneck kettle", "subtask": "Handle gooseneck kettle", "objects": ["gooseneck kettle", "coffee dripper", "digital scale", "water bottle", "coffee mug"], "contact": "yes", "transition": "no", "next_action": "Hold gooseneck kettle", "evidence_window": {"start_frame": 2060, "end_frame": 2079}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": [], "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "2060-2079"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:104", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 2080, "end_frame": 2099, "num_frames": 20}, "true_label": "Hold gooseneck kettle", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": \"unknown\",\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"2080-2099\"\n}\n```", "true_json": {"action": "Hold gooseneck kettle", "subtask": "Handle gooseneck kettle", "objects": ["gooseneck kettle", "coffee dripper", "digital scale", "water bottle", "coffee mug"], "contact": "yes", "transition": "no", "next_action": "Hold gooseneck kettle", "evidence_window": {"start_frame": 2080, "end_frame": 2099}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": "unknown", "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "2080-2099"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:105", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 2100, "end_frame": 2119, "num_frames": 20}, "true_label": "Hold gooseneck kettle", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": [],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"2100-2119\"\n}\n```", "true_json": {"action": "Hold gooseneck kettle", "subtask": "Handle gooseneck kettle", "objects": ["gooseneck kettle", "coffee dripper", "digital scale", "water bottle", "coffee mug"], "contact": "yes", "transition": "no", "next_action": "Hold gooseneck kettle", "evidence_window": {"start_frame": 2100, "end_frame": 2119}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": [], "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "2100-2119"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:106", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 2120, "end_frame": 2139, "num_frames": 20}, "true_label": "Hold gooseneck kettle", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": [\n \"unknown\"\n ],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"2120-2139\"\n}\n```", "true_json": {"action": "Hold gooseneck kettle", "subtask": "Handle gooseneck kettle", "objects": ["gooseneck kettle", "coffee dripper", "digital scale", "water bottle", "coffee mug"], "contact": "yes", "transition": "no", "next_action": "Hold gooseneck kettle", "evidence_window": {"start_frame": 2120, "end_frame": 2139}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": ["unknown"], "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "2120-2139"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:107", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 2140, "end_frame": 2159, "num_frames": 20}, "true_label": "Hold gooseneck kettle", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": \"unknown\",\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"2140-2159\"\n}\n```", "true_json": {"action": "Hold gooseneck kettle", "subtask": "Handle gooseneck kettle", "objects": ["gooseneck kettle", "coffee dripper", "digital scale", "water bottle", "coffee mug"], "contact": "yes", "transition": "no", "next_action": "Hold gooseneck kettle", "evidence_window": {"start_frame": 2140, "end_frame": 2159}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": "unknown", "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "2140-2159"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:140", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 2800, "end_frame": 2819, "num_frames": 20}, "true_label": "Grasp gooseneck kettle", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": [],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"2800-2819\"\n}\n```", "true_json": {"action": "Grasp gooseneck kettle", "subtask": "Lift gooseneck kettle", "objects": ["gooseneck kettle", "coffee dripper", "scale", "water bottle", "white cup"], "contact": "yes", "transition": "no", "next_action": "Grasp gooseneck kettle", "evidence_window": {"start_frame": 2800, "end_frame": 2819}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": [], "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "2800-2819"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:141", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 2820, "end_frame": 2839, "num_frames": 20}, "true_label": "Grasp gooseneck kettle", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": \"unknown\",\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"2820-2839\"\n}\n```", "true_json": {"action": "Grasp gooseneck kettle", "subtask": "Lift gooseneck kettle", "objects": ["gooseneck kettle", "coffee dripper", "scale", "water bottle", "white cup"], "contact": "yes", "transition": "no", "next_action": "Grasp gooseneck kettle", "evidence_window": {"start_frame": 2820, "end_frame": 2839}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": "unknown", "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "2820-2839"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:142", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 2840, "end_frame": 2859, "num_frames": 20}, "true_label": "Grasp gooseneck kettle", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": \"unknown\",\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"2840-2859\"\n}\n```", "true_json": {"action": "Grasp gooseneck kettle", "subtask": "Lift gooseneck kettle", "objects": ["gooseneck kettle", "coffee dripper", "scale", "water bottle", "white cup"], "contact": "yes", "transition": "no", "next_action": "Grasp gooseneck kettle", "evidence_window": {"start_frame": 2840, "end_frame": 2859}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": "unknown", "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "2840-2859"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:143", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 2860, "end_frame": 2879, "num_frames": 20}, "true_label": "Grasp gooseneck kettle", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": \"unknown\",\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"2860-2879\"\n}\n```", "true_json": {"action": "Grasp gooseneck kettle", "subtask": "Lift gooseneck kettle", "objects": ["gooseneck kettle", "coffee dripper", "scale", "water bottle", "white cup"], "contact": "yes", "transition": "no", "next_action": "Grasp gooseneck kettle", "evidence_window": {"start_frame": 2860, "end_frame": 2879}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": "unknown", "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "2860-2879"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:144", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 2880, "end_frame": 2899, "num_frames": 20}, "true_label": "Grasp gooseneck kettle", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": [\n \"white bottle\"\n ],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"2880-2899\"\n}\n```", "true_json": {"action": "Grasp gooseneck kettle", "subtask": "Lift gooseneck kettle", "objects": ["gooseneck kettle", "coffee dripper", "scale", "water bottle", "white cup"], "contact": "yes", "transition": "no", "next_action": "Grasp gooseneck kettle", "evidence_window": {"start_frame": 2880, "end_frame": 2899}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": ["white bottle"], "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "2880-2899"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:145", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 2900, "end_frame": 2919, "num_frames": 20}, "true_label": "Grasp gooseneck kettle", "raw_prediction": "```json\n{\n \"action\": \"Wait/Prepare for pouring\",\n \"subtask\": \"Prepare for pouring\",\n \"objects\": [\n \"gooseneck kettle\"\n ],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"Pour coffee\",\n \"evidence_window\": \"2900-2919\"\n}\n```", "true_json": {"action": "Grasp gooseneck kettle", "subtask": "Lift gooseneck kettle", "objects": ["gooseneck kettle", "coffee dripper", "scale", "water bottle", "white cup"], "contact": "yes", "transition": "no", "next_action": "Lift gooseneck kettle", "evidence_window": {"start_frame": 2900, "end_frame": 2919}}, "pred_json": {"action": "Wait/Prepare for pouring", "subtask": "Prepare for pouring", "objects": ["gooseneck kettle"], "contact": "unknown", "transition": "unknown", "next_action": "Pour coffee", "evidence_window": "2900-2919"}, "predicted_label": "Wait/Prepare for pouring", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:146", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 2920, "end_frame": 2939, "num_frames": 20}, "true_label": "Lift gooseneck kettle", "raw_prediction": "```json\n{\n \"action\": \"Wait/Prepare for pouring\",\n \"subtask\": \"Prepare for pouring\",\n \"objects\": [\n \"gooseneck kettle\"\n ],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"Pour coffee\",\n \"evidence_window\": \"2920-2939\"\n}\n```", "true_json": {"action": "Lift gooseneck kettle", "subtask": "Lift gooseneck kettle", "objects": ["gooseneck kettle", "coffee dripper", "scale", "water bottle", "white cup"], "contact": "yes", "transition": "no", "next_action": "Lift gooseneck kettle", "evidence_window": {"start_frame": 2920, "end_frame": 2939}}, "pred_json": {"action": "Wait/Prepare for pouring", "subtask": "Prepare for pouring", "objects": ["gooseneck kettle"], "contact": "unknown", "transition": "unknown", "next_action": "Pour coffee", "evidence_window": "2920-2939"}, "predicted_label": "Wait/Prepare for pouring", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:147", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 2940, "end_frame": 2959, "num_frames": 20}, "true_label": "Lift gooseneck kettle", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": [\n \"white bottle\"\n ],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"2940-2959\"\n}\n```", "true_json": {"action": "Lift gooseneck kettle", "subtask": "Lift gooseneck kettle", "objects": ["gooseneck kettle", "coffee dripper", "scale", "water bottle", "white cup"], "contact": "yes", "transition": "no", "next_action": "Lift gooseneck kettle", "evidence_window": {"start_frame": 2940, "end_frame": 2959}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": ["white bottle"], "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "2940-2959"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:148", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 2960, "end_frame": 2979, "num_frames": 20}, "true_label": "Lift gooseneck kettle", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": [\n \"white bottle\"\n ],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"unknown\"\n}\n```", "true_json": {"action": "Lift gooseneck kettle", "subtask": "Lift gooseneck kettle", "objects": ["gooseneck kettle", "coffee dripper", "scale"], "contact": "yes", "transition": "no", "next_action": "Lift gooseneck kettle", "evidence_window": {"start_frame": 2960, "end_frame": 2979}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": ["white bottle"], "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "unknown"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:149", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 2980, "end_frame": 2999, "num_frames": 20}, "true_label": "Lift gooseneck kettle", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": \"unknown\",\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"2980-2999\"\n}\n```", "true_json": {"action": "Lift gooseneck kettle", "subtask": "Lift gooseneck kettle", "objects": ["gooseneck kettle", "coffee dripper", "scale"], "contact": "yes", "transition": "no", "next_action": "Lift gooseneck kettle", "evidence_window": {"start_frame": 2980, "end_frame": 2999}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": "unknown", "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "2980-2999"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:150", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 3000, "end_frame": 3019, "num_frames": 20}, "true_label": "Lift gooseneck kettle", "raw_prediction": "```json\n{\n \"action\": \"Wait/Prepare for pouring\",\n \"subtask\": \"Prepare for pouring\",\n \"objects\": [\n \"gooseneck kettle\"\n ],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"Pour coffee\",\n \"evidence_window\": \"3000-3019\"\n}\n```", "true_json": {"action": "Lift gooseneck kettle", "subtask": "Lift gooseneck kettle", "objects": ["gooseneck kettle", "coffee dripper", "digital scale", "white mug"], "contact": "yes", "transition": "no", "next_action": "Lift gooseneck kettle", "evidence_window": {"start_frame": 3000, "end_frame": 3019}}, "pred_json": {"action": "Wait/Prepare for pouring", "subtask": "Prepare for pouring", "objects": ["gooseneck kettle"], "contact": "unknown", "transition": "unknown", "next_action": "Pour coffee", "evidence_window": "3000-3019"}, "predicted_label": "Wait/Prepare for pouring", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:151", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 3020, "end_frame": 3039, "num_frames": 20}, "true_label": "Lift gooseneck kettle", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": [],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"3020-3039\"\n}\n```", "true_json": {"action": "Lift gooseneck kettle", "subtask": "Lift gooseneck kettle", "objects": ["gooseneck kettle", "coffee dripper", "digital scale", "white mug"], "contact": "yes", "transition": "no", "next_action": "Lift gooseneck kettle", "evidence_window": {"start_frame": 3020, "end_frame": 3039}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": [], "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "3020-3039"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:152", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 3040, "end_frame": 3059, "num_frames": 20}, "true_label": "Lift gooseneck kettle", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": \"unknown\",\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"3040-3059\"\n}\n```", "true_json": {"action": "Lift gooseneck kettle", "subtask": "Lift gooseneck kettle", "objects": ["gooseneck kettle", "coffee dripper", "digital scale", "white mug"], "contact": "yes", "transition": "no", "next_action": "Lift gooseneck kettle", "evidence_window": {"start_frame": 3040, "end_frame": 3059}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": "unknown", "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "3040-3059"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:153", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 3060, "end_frame": 3079, "num_frames": 20}, "true_label": "Lift gooseneck kettle", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": [\n \"white bottle\"\n ],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"3060-3079\"\n}\n```", "true_json": {"action": "Lift gooseneck kettle", "subtask": "Lift gooseneck kettle", "objects": ["gooseneck kettle", "coffee dripper", "digital scale", "white mug"], "contact": "yes", "transition": "no", "next_action": "Lift gooseneck kettle", "evidence_window": {"start_frame": 3060, "end_frame": 3079}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": ["white bottle"], "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "3060-3079"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:170", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 3400, "end_frame": 3419, "num_frames": 20}, "true_label": "Move kettle away", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": [],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"3400-3419\"\n}\n```", "true_json": {"action": "Move kettle away", "subtask": "Set down kettle and retrieve white bottle", "objects": ["gooseneck kettle", "coffee dripper", "scale", "white bottle"], "contact": "yes", "transition": "no", "next_action": "Move kettle away", "evidence_window": {"start_frame": 3400, "end_frame": 3419}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": [], "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "3400-3419"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:171", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 3420, "end_frame": 3439, "num_frames": 20}, "true_label": "Move kettle away", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": \"unknown\",\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"3420-3439\"\n}\n```", "true_json": {"action": "Move kettle away", "subtask": "Set down kettle and retrieve white bottle", "objects": ["gooseneck kettle", "coffee dripper", "scale", "white bottle"], "contact": "yes", "transition": "no", "next_action": "Move kettle away", "evidence_window": {"start_frame": 3420, "end_frame": 3439}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": "unknown", "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "3420-3439"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:172", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 3440, "end_frame": 3459, "num_frames": 20}, "true_label": "Move kettle away", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": \"unknown\",\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"3440-3459\"\n}\n```", "true_json": {"action": "Move kettle away", "subtask": "Set down kettle and retrieve white bottle", "objects": ["gooseneck kettle", "coffee dripper", "scale", "white bottle"], "contact": "yes", "transition": "no", "next_action": "Move kettle away", "evidence_window": {"start_frame": 3440, "end_frame": 3459}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": "unknown", "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "3440-3459"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:173", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 3460, "end_frame": 3479, "num_frames": 20}, "true_label": "Move kettle away", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": \"unknown\",\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"3460-3479\"\n}\n```", "true_json": {"action": "Move kettle away", "subtask": "Set down kettle and retrieve white bottle", "objects": ["gooseneck kettle", "coffee dripper", "scale", "white bottle"], "contact": "yes", "transition": "no", "next_action": "Move kettle away", "evidence_window": {"start_frame": 3460, "end_frame": 3479}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": "unknown", "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "3460-3479"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:174", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 3480, "end_frame": 3499, "num_frames": 20}, "true_label": "Move kettle away", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": \"unknown\",\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"3480-3499\"\n}\n```", "true_json": {"action": "Move kettle away", "subtask": "Set down kettle and retrieve white bottle", "objects": ["gooseneck kettle", "coffee dripper", "scale", "white bottle"], "contact": "yes", "transition": "no", "next_action": "Move kettle away", "evidence_window": {"start_frame": 3480, "end_frame": 3499}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": "unknown", "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "3480-3499"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:175", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 3500, "end_frame": 3519, "num_frames": 20}, "true_label": "Move kettle away", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": \"unknown\",\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"3500-3519\"\n}\n```", "true_json": {"action": "Move kettle away", "subtask": "Set down kettle and retrieve white bottle", "objects": ["gooseneck kettle", "coffee dripper", "scale", "white bottle"], "contact": "yes", "transition": "no", "next_action": "Move kettle away", "evidence_window": {"start_frame": 3500, "end_frame": 3519}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": "unknown", "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "3500-3519"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:176", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 3520, "end_frame": 3539, "num_frames": 20}, "true_label": "Move kettle away", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": \"unknown\",\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"3520-3539\"\n}\n```", "true_json": {"action": "Move kettle away", "subtask": "Set down kettle and retrieve white bottle", "objects": ["gooseneck kettle", "coffee dripper", "scale", "white bottle"], "contact": "yes", "transition": "no", "next_action": "Move kettle away", "evidence_window": {"start_frame": 3520, "end_frame": 3539}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": "unknown", "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "3520-3539"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:177", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 3540, "end_frame": 3559, "num_frames": 20}, "true_label": "Move kettle away", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": \"unknown\",\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"3540-3559\"\n}\n```", "true_json": {"action": "Move kettle away", "subtask": "Set down kettle and retrieve white bottle", "objects": ["gooseneck kettle", "coffee dripper", "scale", "white bottle"], "contact": "yes", "transition": "no", "next_action": "Place kettle on table", "evidence_window": {"start_frame": 3540, "end_frame": 3559}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": "unknown", "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "3540-3559"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:178", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 3560, "end_frame": 3579, "num_frames": 20}, "true_label": "Place kettle on table", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": \"unknown\",\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"3560-3579\"\n}\n```", "true_json": {"action": "Place kettle on table", "subtask": "Set down kettle and retrieve white bottle", "objects": ["gooseneck kettle", "coffee dripper", "scale", "white bottle"], "contact": "yes", "transition": "no", "next_action": "Place kettle on table", "evidence_window": {"start_frame": 3560, "end_frame": 3579}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": "unknown", "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "3560-3579"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:179", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 3580, "end_frame": 3599, "num_frames": 20}, "true_label": "Place kettle on table", "raw_prediction": "```json\n{\n \"action\": \"Wait/Prepare for pouring\",\n \"subtask\": \"Prepare for pouring\",\n \"objects\": [\n \"gooseneck kettle\"\n ],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"Pour coffee\",\n \"evidence_window\": \"3580-3599\"\n}\n```", "true_json": {"action": "Place kettle on table", "subtask": "Set down kettle and retrieve white bottle", "objects": ["gooseneck kettle", "coffee dripper", "scale", "white bottle"], "contact": "yes", "transition": "no", "next_action": "Place kettle on table", "evidence_window": {"start_frame": 3580, "end_frame": 3599}}, "pred_json": {"action": "Wait/Prepare for pouring", "subtask": "Prepare for pouring", "objects": ["gooseneck kettle"], "contact": "unknown", "transition": "unknown", "next_action": "Pour coffee", "evidence_window": "3580-3599"}, "predicted_label": "Wait/Prepare for pouring", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:180", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 3600, "end_frame": 3619, "num_frames": 20}, "true_label": "Place kettle on table", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": \"unknown\",\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"unknown\"\n}\n```", "true_json": {"action": "Place kettle on table", "subtask": "Set down kettle and retrieve white bottle", "objects": ["gooseneck kettle", "coffee dripper", "scale", "white bottle"], "contact": "yes", "transition": "no", "next_action": "Place kettle on table", "evidence_window": {"start_frame": 3600, "end_frame": 3619}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": "unknown", "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "unknown"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:181", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 3620, "end_frame": 3639, "num_frames": 20}, "true_label": "Place kettle on table", "raw_prediction": "```json\n{\n \"action\": \"Wait/Prepare for pouring\",\n \"subtask\": \"Prepare for pouring\",\n \"objects\": [\n \"gooseneck kettle\"\n ],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"Pour coffee\",\n \"evidence_window\": \"3620-3639\"\n}\n```", "true_json": {"action": "Place kettle on table", "subtask": "Set down kettle and retrieve white bottle", "objects": ["gooseneck kettle", "coffee dripper", "scale", "white bottle"], "contact": "yes", "transition": "no", "next_action": "Place kettle on table", "evidence_window": {"start_frame": 3620, "end_frame": 3639}}, "pred_json": {"action": "Wait/Prepare for pouring", "subtask": "Prepare for pouring", "objects": ["gooseneck kettle"], "contact": "unknown", "transition": "unknown", "next_action": "Pour coffee", "evidence_window": "3620-3639"}, "predicted_label": "Wait/Prepare for pouring", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:182", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 3640, "end_frame": 3659, "num_frames": 20}, "true_label": "Place kettle on table", "raw_prediction": "```json\n{\n \"action\": \"Wait/Prepare for pouring\",\n \"subtask\": \"Prepare for pouring\",\n \"objects\": [\n \"gooseneck kettle\"\n ],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"Pour coffee\",\n \"evidence_window\": \"3640-3659\"\n}\n```", "true_json": {"action": "Place kettle on table", "subtask": "Set down kettle and retrieve white bottle", "objects": ["gooseneck kettle", "coffee dripper", "scale", "white bottle"], "contact": "yes", "transition": "no", "next_action": "Place kettle on table", "evidence_window": {"start_frame": 3640, "end_frame": 3659}}, "pred_json": {"action": "Wait/Prepare for pouring", "subtask": "Prepare for pouring", "objects": ["gooseneck kettle"], "contact": "unknown", "transition": "unknown", "next_action": "Pour coffee", "evidence_window": "3640-3659"}, "predicted_label": "Wait/Prepare for pouring", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:183", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 3660, "end_frame": 3679, "num_frames": 20}, "true_label": "Place kettle on table", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": \"unknown\",\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"3660-3679\"\n}\n```", "true_json": {"action": "Place kettle on table", "subtask": "Set down kettle and retrieve white bottle", "objects": ["gooseneck kettle", "coffee dripper", "scale", "white bottle"], "contact": "yes", "transition": "no", "next_action": "Pick up white bottle", "evidence_window": {"start_frame": 3660, "end_frame": 3679}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": "unknown", "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "3660-3679"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:184", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 3680, "end_frame": 3699, "num_frames": 20}, "true_label": "Pick up white bottle", "raw_prediction": "```json\n{\n \"action\": \"Wait/Prepare for pouring\",\n \"subtask\": \"Prepare for pouring\",\n \"objects\": [\n \"gooseneck kettle\"\n ],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"Pour coffee\",\n \"evidence_window\": \"3680-3699\"\n}\n```", "true_json": {"action": "Pick up white bottle", "subtask": "Set down kettle and retrieve white bottle", "objects": ["gooseneck kettle", "coffee dripper", "scale", "white bottle"], "contact": "yes", "transition": "no", "next_action": "Pick up white bottle", "evidence_window": {"start_frame": 3680, "end_frame": 3699}}, "pred_json": {"action": "Wait/Prepare for pouring", "subtask": "Prepare for pouring", "objects": ["gooseneck kettle"], "contact": "unknown", "transition": "unknown", "next_action": "Pour coffee", "evidence_window": "3680-3699"}, "predicted_label": "Wait/Prepare for pouring", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:185", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 3700, "end_frame": 3719, "num_frames": 20}, "true_label": "Pick up white bottle", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": \"unknown\",\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"3700-3719\"\n}\n```", "true_json": {"action": "Pick up white bottle", "subtask": "Set down kettle and retrieve white bottle", "objects": ["gooseneck kettle", "coffee dripper", "scale", "white bottle"], "contact": "yes", "transition": "no", "next_action": "Pick up white bottle", "evidence_window": {"start_frame": 3700, "end_frame": 3719}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": "unknown", "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "3700-3719"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:186", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 3720, "end_frame": 3739, "num_frames": 20}, "true_label": "Pick up white bottle", "raw_prediction": "```json\n{\n \"action\": \"Wait/Prepare for pouring\",\n \"subtask\": \"Prepare for pouring\",\n \"objects\": [\n \"gooseneck kettle\"\n ],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"Pour coffee\",\n \"evidence_window\": \"3720-3739\"\n}\n```", "true_json": {"action": "Pick up white bottle", "subtask": "Set down kettle and retrieve white bottle", "objects": ["gooseneck kettle", "coffee dripper", "scale", "white bottle"], "contact": "yes", "transition": "no", "next_action": "Pick up white bottle", "evidence_window": {"start_frame": 3720, "end_frame": 3739}}, "pred_json": {"action": "Wait/Prepare for pouring", "subtask": "Prepare for pouring", "objects": ["gooseneck kettle"], "contact": "unknown", "transition": "unknown", "next_action": "Pour coffee", "evidence_window": "3720-3739"}, "predicted_label": "Wait/Prepare for pouring", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:187", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 3740, "end_frame": 3759, "num_frames": 20}, "true_label": "Pick up white bottle", "raw_prediction": "```json\n{\n \"action\": \"Wait/Prepare for pouring\",\n \"subtask\": \"Prepare for pouring\",\n \"objects\": [\n \"gooseneck kettle\"\n ],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"Pour coffee\",\n \"evidence_window\": \"3740-3759\"\n}\n```", "true_json": {"action": "Pick up white bottle", "subtask": "Set down kettle and retrieve white bottle", "objects": ["gooseneck kettle", "coffee dripper", "scale", "white bottle"], "contact": "yes", "transition": "no", "next_action": "Pick up white bottle", "evidence_window": {"start_frame": 3740, "end_frame": 3759}}, "pred_json": {"action": "Wait/Prepare for pouring", "subtask": "Prepare for pouring", "objects": ["gooseneck kettle"], "contact": "unknown", "transition": "unknown", "next_action": "Pour coffee", "evidence_window": "3740-3759"}, "predicted_label": "Wait/Prepare for pouring", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:188", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 3760, "end_frame": 3779, "num_frames": 20}, "true_label": "Pick up white bottle", "raw_prediction": "```json\n{\n \"action\": \"Wait/Prepare for pouring\",\n \"subtask\": \"Prepare for pouring\",\n \"objects\": [\n \"gooseneck kettle\"\n ],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"Pour coffee\",\n \"evidence_window\": \"3760-3779\"\n}\n```", "true_json": {"action": "Pick up white bottle", "subtask": "Set down kettle and retrieve white bottle", "objects": ["gooseneck kettle", "coffee dripper", "scale", "white bottle"], "contact": "yes", "transition": "no", "next_action": "Pick up white bottle", "evidence_window": {"start_frame": 3760, "end_frame": 3779}}, "pred_json": {"action": "Wait/Prepare for pouring", "subtask": "Prepare for pouring", "objects": ["gooseneck kettle"], "contact": "unknown", "transition": "unknown", "next_action": "Pour coffee", "evidence_window": "3760-3779"}, "predicted_label": "Wait/Prepare for pouring", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:189", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 3780, "end_frame": 3799, "num_frames": 20}, "true_label": "Pick up white bottle", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": \"unknown\",\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"3780-3799\"\n}\n```", "true_json": {"action": "Pick up white bottle", "subtask": "Set down kettle and retrieve white bottle", "objects": ["gooseneck kettle", "coffee dripper", "scale", "white bottle"], "contact": "yes", "transition": "no", "next_action": "Pour liquid from white bottle", "evidence_window": {"start_frame": 3780, "end_frame": 3799}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": "unknown", "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "3780-3799"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:190", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 3800, "end_frame": 3819, "num_frames": 20}, "true_label": "Pour liquid from white bottle", "raw_prediction": "```json\n{\n \"action\": \"Wait/Prepare for pouring\",\n \"subtask\": \"Prepare for pouring\",\n \"objects\": [\n \"gooseneck kettle\"\n ],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"Pour coffee\",\n \"evidence_window\": \"3800-3819\"\n}\n```", "true_json": {"action": "Pour liquid from white bottle", "subtask": "Pour and close white bottle", "objects": ["white bottle", "coffee dripper", "scale"], "contact": "yes", "transition": "no", "next_action": "Pour liquid from white bottle", "evidence_window": {"start_frame": 3800, "end_frame": 3819}}, "pred_json": {"action": "Wait/Prepare for pouring", "subtask": "Prepare for pouring", "objects": ["gooseneck kettle"], "contact": "unknown", "transition": "unknown", "next_action": "Pour coffee", "evidence_window": "3800-3819"}, "predicted_label": "Wait/Prepare for pouring", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:191", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 3820, "end_frame": 3839, "num_frames": 20}, "true_label": "Pour liquid from white bottle", "raw_prediction": "```json\n{\n \"action\": \"Wait/Prepare for pouring\",\n \"subtask\": \"Prepare for pouring\",\n \"objects\": [\n \"gooseneck kettle\"\n ],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"Pour coffee\",\n \"evidence_window\": \"3820-3839\"\n}\n```", "true_json": {"action": "Pour liquid from white bottle", "subtask": "Pour and close white bottle", "objects": ["white bottle", "coffee dripper", "scale"], "contact": "yes", "transition": "no", "next_action": "Pour liquid from white bottle", "evidence_window": {"start_frame": 3820, "end_frame": 3839}}, "pred_json": {"action": "Wait/Prepare for pouring", "subtask": "Prepare for pouring", "objects": ["gooseneck kettle"], "contact": "unknown", "transition": "unknown", "next_action": "Pour coffee", "evidence_window": "3820-3839"}, "predicted_label": "Wait/Prepare for pouring", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:192", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 3840, "end_frame": 3859, "num_frames": 20}, "true_label": "Pour liquid from white bottle", "raw_prediction": "```json\n{\n \"action\": \"Wait/Prepare for pouring\",\n \"subtask\": \"Prepare for pouring\",\n \"objects\": [],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"Pour coffee\",\n \"evidence_window\": \"3840-3859\"\n}\n```", "true_json": {"action": "Pour liquid from white bottle", "subtask": "Pour and close white bottle", "objects": ["white bottle", "coffee dripper", "scale"], "contact": "yes", "transition": "no", "next_action": "Pour liquid from white bottle", "evidence_window": {"start_frame": 3840, "end_frame": 3859}}, "pred_json": {"action": "Wait/Prepare for pouring", "subtask": "Prepare for pouring", "objects": [], "contact": "unknown", "transition": "unknown", "next_action": "Pour coffee", "evidence_window": "3840-3859"}, "predicted_label": "Wait/Prepare for pouring", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:193", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 3860, "end_frame": 3879, "num_frames": 20}, "true_label": "Pour liquid from white bottle", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": \"unknown\",\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"3860-3879\"\n}\n```", "true_json": {"action": "Pour liquid from white bottle", "subtask": "Pour and close white bottle", "objects": ["white bottle", "coffee dripper", "scale"], "contact": "yes", "transition": "no", "next_action": "Pour liquid from white bottle", "evidence_window": {"start_frame": 3860, "end_frame": 3879}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": "unknown", "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "3860-3879"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:194", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 3880, "end_frame": 3899, "num_frames": 20}, "true_label": "Pour liquid from white bottle", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": [],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"3880-3899\"\n}\n```", "true_json": {"action": "Pour liquid from white bottle", "subtask": "Pour and close white bottle", "objects": ["white bottle", "coffee dripper", "scale"], "contact": "yes", "transition": "no", "next_action": "Pour liquid from white bottle", "evidence_window": {"start_frame": 3880, "end_frame": 3899}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": [], "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "3880-3899"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:195", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 3900, "end_frame": 3919, "num_frames": 20}, "true_label": "Pour liquid from white bottle", "raw_prediction": "```json\n{\n \"action\": \"Wait/Prepare for pouring\",\n \"subtask\": \"Prepare for pouring\",\n \"objects\": [],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"Pour coffee\",\n \"evidence_window\": \"3900-3919\"\n}\n```", "true_json": {"action": "Pour liquid from white bottle", "subtask": "Pour and close white bottle", "objects": ["white bottle", "coffee dripper", "scale"], "contact": "yes", "transition": "no", "next_action": "Close bottle cap", "evidence_window": {"start_frame": 3900, "end_frame": 3919}}, "pred_json": {"action": "Wait/Prepare for pouring", "subtask": "Prepare for pouring", "objects": [], "contact": "unknown", "transition": "unknown", "next_action": "Pour coffee", "evidence_window": "3900-3919"}, "predicted_label": "Wait/Prepare for pouring", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:196", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 3920, "end_frame": 3939, "num_frames": 20}, "true_label": "Close bottle cap", "raw_prediction": "```json\n{\n \"action\": \"Wait/Prepare for pouring\",\n \"subtask\": \"Prepare for pouring\",\n \"objects\": [],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"unknown\"\n}\n```", "true_json": {"action": "Close bottle cap", "subtask": "Pour and close white bottle", "objects": ["white bottle"], "contact": "yes", "transition": "no", "next_action": "Close bottle cap", "evidence_window": {"start_frame": 3920, "end_frame": 3939}}, "pred_json": {"action": "Wait/Prepare for pouring", "subtask": "Prepare for pouring", "objects": [], "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "unknown"}, "predicted_label": "Wait/Prepare for pouring", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:197", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 3940, "end_frame": 3959, "num_frames": 20}, "true_label": "Close bottle cap", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": \"unknown\",\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"3940-3959\"\n}\n```", "true_json": {"action": "Close bottle cap", "subtask": "Pour and close white bottle", "objects": ["white bottle"], "contact": "yes", "transition": "no", "next_action": "Close bottle cap", "evidence_window": {"start_frame": 3940, "end_frame": 3959}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": "unknown", "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "3940-3959"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:198", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 3960, "end_frame": 3979, "num_frames": 20}, "true_label": "Close bottle cap", "raw_prediction": "```json\n{\n \"action\": \"Wait/Prepare for pouring\",\n \"subtask\": \"Prepare for pouring\",\n \"objects\": [\"gooseneck kettle\"],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"Pour coffee\",\n \"evidence_window\": \"3960-3979\"\n}\n```", "true_json": {"action": "Close bottle cap", "subtask": "Pour and close white bottle", "objects": ["white bottle"], "contact": "yes", "transition": "no", "next_action": "Close bottle cap", "evidence_window": {"start_frame": 3960, "end_frame": 3979}}, "pred_json": {"action": "Wait/Prepare for pouring", "subtask": "Prepare for pouring", "objects": ["gooseneck kettle"], "contact": "unknown", "transition": "unknown", "next_action": "Pour coffee", "evidence_window": "3960-3979"}, "predicted_label": "Wait/Prepare for pouring", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:199", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 3980, "end_frame": 3999, "num_frames": 20}, "true_label": "Close bottle cap", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": [\n \"gooseneck kettle\",\n \"white bottle\"\n ],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"3980-3999\"\n}\n```", "true_json": {"action": "Close bottle cap", "subtask": "Pour and close white bottle", "objects": ["white bottle"], "contact": "yes", "transition": "no", "next_action": "Close bottle cap", "evidence_window": {"start_frame": 3980, "end_frame": 3999}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": ["gooseneck kettle", "white bottle"], "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "3980-3999"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:200", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 4000, "end_frame": 4019, "num_frames": 20}, "true_label": "Close bottle cap", "raw_prediction": "```json\n{\n \"action\": \"Wait/Prepare for pouring\",\n \"subtask\": \"Prepare for pouring\",\n \"objects\": [\"gooseneck kettle\"],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"Pour coffee\",\n \"evidence_window\": \"4000-4019\"\n}\n```", "true_json": {"action": "Close bottle cap", "subtask": "Pour and close white bottle", "objects": ["white bottle", "coffee dripper", "scale", "mug"], "contact": "yes", "transition": "no", "next_action": "Close bottle cap", "evidence_window": {"start_frame": 4000, "end_frame": 4019}}, "pred_json": {"action": "Wait/Prepare for pouring", "subtask": "Prepare for pouring", "objects": ["gooseneck kettle"], "contact": "unknown", "transition": "unknown", "next_action": "Pour coffee", "evidence_window": "4000-4019"}, "predicted_label": "Wait/Prepare for pouring", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:201", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 4020, "end_frame": 4039, "num_frames": 20}, "true_label": "Close bottle cap", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": \"unknown\",\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"4020-4039\"\n}\n```", "true_json": {"action": "Close bottle cap", "subtask": "Pour and close white bottle", "objects": ["white bottle", "coffee dripper", "scale", "mug"], "contact": "yes", "transition": "no", "next_action": "Close bottle cap", "evidence_window": {"start_frame": 4020, "end_frame": 4039}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": "unknown", "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "4020-4039"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:202", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 4040, "end_frame": 4059, "num_frames": 20}, "true_label": "Close bottle cap", "raw_prediction": "```json\n{\n \"action\": \"Pour milk into coffee\",\n \"subtask\": \"Pour milk into coffee\",\n \"objects\": [\n \"white bottle\",\n \"coffee\"\n ],\n \"contact\": \"white bottle\",\n \"transition\": \"Pouring milk into coffee\",\n \"next_action\": \"Place white bottle on table\",\n \"evidence_window\": \"4040-4059\"\n}\n```", "true_json": {"action": "Close bottle cap", "subtask": "Pour and close white bottle", "objects": ["white bottle", "coffee dripper", "scale", "mug"], "contact": "yes", "transition": "no", "next_action": "Close bottle cap", "evidence_window": {"start_frame": 4040, "end_frame": 4059}}, "pred_json": {"action": "Pour milk into coffee", "subtask": "Pour milk into coffee", "objects": ["white bottle", "coffee"], "contact": "white bottle", "transition": "Pouring milk into coffee", "next_action": "Place white bottle on table", "evidence_window": "4040-4059"}, "predicted_label": "Pour milk into coffee", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:203", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 4060, "end_frame": 4079, "num_frames": 20}, "true_label": "Close bottle cap", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": [],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"4060-4079\"\n}\n```", "true_json": {"action": "Close bottle cap", "subtask": "Pour and close white bottle", "objects": ["white bottle", "coffee dripper", "scale", "mug"], "contact": "yes", "transition": "no", "next_action": "Close bottle cap", "evidence_window": {"start_frame": 4060, "end_frame": 4079}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": [], "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "4060-4079"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:204", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 4080, "end_frame": 4099, "num_frames": 20}, "true_label": "Close bottle cap", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": \"unknown\",\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"4080-4099\"\n}\n```", "true_json": {"action": "Close bottle cap", "subtask": "Pour and close white bottle", "objects": ["white bottle", "coffee dripper", "scale", "mug"], "contact": "yes", "transition": "no", "next_action": "Close bottle cap", "evidence_window": {"start_frame": 4080, "end_frame": 4099}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": "unknown", "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "4080-4099"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:220", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 4400, "end_frame": 4419, "num_frames": 20}, "true_label": "Place item on table", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": [\n \"unknown\"\n ],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"4400-4419\"\n}\n```", "true_json": {"action": "Place item on table", "subtask": "Prepare for pouring", "objects": ["coffee equipment", "small bottle", "white mug", "weighing scale"], "contact": "yes", "transition": "no", "next_action": "Place item on table", "evidence_window": {"start_frame": 4400, "end_frame": 4419}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": ["unknown"], "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "4400-4419"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:221", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 4420, "end_frame": 4439, "num_frames": 20}, "true_label": "Place item on table", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": \"unknown\",\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"4420-4439\"\n}\n```", "true_json": {"action": "Place item on table", "subtask": "Prepare for pouring", "objects": ["coffee equipment", "small bottle", "white mug", "weighing scale"], "contact": "yes", "transition": "no", "next_action": "Place item on table", "evidence_window": {"start_frame": 4420, "end_frame": 4439}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": "unknown", "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "4420-4439"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:222", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 4440, "end_frame": 4459, "num_frames": 20}, "true_label": "Place item on table", "raw_prediction": "```json\n{\n \"action\": \"Wait/Prepare for pouring\",\n \"subtask\": \"Prepare for pouring\",\n \"objects\": [\n \"gooseneck kettle\"\n ],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"Pour coffee\",\n \"evidence_window\": \"4440-4459\"\n}\n```", "true_json": {"action": "Place item on table", "subtask": "Prepare for pouring", "objects": ["coffee equipment", "small bottle", "white mug", "weighing scale"], "contact": "yes", "transition": "no", "next_action": "Place item on table", "evidence_window": {"start_frame": 4440, "end_frame": 4459}}, "pred_json": {"action": "Wait/Prepare for pouring", "subtask": "Prepare for pouring", "objects": ["gooseneck kettle"], "contact": "unknown", "transition": "unknown", "next_action": "Pour coffee", "evidence_window": "4440-4459"}, "predicted_label": "Wait/Prepare for pouring", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:223", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 4460, "end_frame": 4479, "num_frames": 20}, "true_label": "Place item on table", "raw_prediction": "```json\n{\n \"action\": \"Wait/Prepare for pouring\",\n \"subtask\": \"Prepare for pouring\",\n \"objects\": [\n \"gooseneck kettle\"\n ],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"Pour coffee\",\n \"evidence_window\": \"4460-4479\"\n}\n```", "true_json": {"action": "Place item on table", "subtask": "Prepare for pouring", "objects": ["coffee equipment", "small bottle", "white mug", "weighing scale"], "contact": "yes", "transition": "no", "next_action": "Place item on table", "evidence_window": {"start_frame": 4460, "end_frame": 4479}}, "pred_json": {"action": "Wait/Prepare for pouring", "subtask": "Prepare for pouring", "objects": ["gooseneck kettle"], "contact": "unknown", "transition": "unknown", "next_action": "Pour coffee", "evidence_window": "4460-4479"}, "predicted_label": "Wait/Prepare for pouring", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:224", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 4480, "end_frame": 4499, "num_frames": 20}, "true_label": "Place item on table", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": [],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"4480-4499\"\n}\n```", "true_json": {"action": "Place item on table", "subtask": "Prepare for pouring", "objects": ["coffee equipment", "small bottle", "white mug", "weighing scale"], "contact": "yes", "transition": "no", "next_action": "Place item on table", "evidence_window": {"start_frame": 4480, "end_frame": 4499}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": [], "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "4480-4499"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:225", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 4500, "end_frame": 4519, "num_frames": 20}, "true_label": "Place item on table", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": [],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"4500-4519\"\n}\n```", "true_json": {"action": "Place item on table", "subtask": "Prepare for pouring", "objects": ["coffee equipment", "small bottle", "white mug", "weighing scale"], "contact": "yes", "transition": "no", "next_action": "Wait/Prepare for pouring", "evidence_window": {"start_frame": 4500, "end_frame": 4519}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": [], "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "4500-4519"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:226", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 4520, "end_frame": 4539, "num_frames": 20}, "true_label": "Wait/Prepare for pouring", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": [\n \"gooseneck kettle\",\n \"white bottle\"\n ],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"unknown\"\n}\n```", "true_json": {"action": "Wait/Prepare for pouring", "subtask": "Prepare for pouring", "objects": ["coffee equipment", "small bottle", "white mug", "weighing scale"], "contact": "yes", "transition": "no", "next_action": "Wait/Prepare for pouring", "evidence_window": {"start_frame": 4520, "end_frame": 4539}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": ["gooseneck kettle", "white bottle"], "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "unknown"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:227", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 4540, "end_frame": 4559, "num_frames": 20}, "true_label": "Wait/Prepare for pouring", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": \"unknown\",\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"4540-4559\"\n}\n```", "true_json": {"action": "Wait/Prepare for pouring", "subtask": "Prepare for pouring", "objects": ["coffee equipment", "small bottle", "white mug", "weighing scale"], "contact": "yes", "transition": "no", "next_action": "Wait/Prepare for pouring", "evidence_window": {"start_frame": 4540, "end_frame": 4559}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": "unknown", "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "4540-4559"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:228", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 4560, "end_frame": 4579, "num_frames": 20}, "true_label": "Wait/Prepare for pouring", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": [],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"4560-4579\"\n}\n```", "true_json": {"action": "Wait/Prepare for pouring", "subtask": "Prepare for pouring", "objects": ["coffee equipment", "small bottle", "white mug", "weighing scale"], "contact": "yes", "transition": "no", "next_action": "Wait/Prepare for pouring", "evidence_window": {"start_frame": 4560, "end_frame": 4579}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": [], "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "4560-4579"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:229", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 4580, "end_frame": 4599, "num_frames": 20}, "true_label": "Wait/Prepare for pouring", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": [],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"4580-4599\"\n}\n```", "true_json": {"action": "Wait/Prepare for pouring", "subtask": "Prepare for pouring", "objects": ["coffee equipment", "small bottle", "white mug", "weighing scale"], "contact": "yes", "transition": "no", "next_action": "Wait/Prepare for pouring", "evidence_window": {"start_frame": 4580, "end_frame": 4599}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": [], "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "4580-4599"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:230", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 4600, "end_frame": 4619, "num_frames": 20}, "true_label": "Wait/Prepare for pouring", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": \"unknown\",\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"4600-4619\"\n}\n```", "true_json": {"action": "Wait/Prepare for pouring", "subtask": "Prepare for pouring", "objects": ["coffee equipment", "small bottle", "white mug", "weighing scale"], "contact": "yes", "transition": "no", "next_action": "Wait/Prepare for pouring", "evidence_window": {"start_frame": 4600, "end_frame": 4619}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": "unknown", "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "4600-4619"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:231", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 4620, "end_frame": 4639, "num_frames": 20}, "true_label": "Wait/Prepare for pouring", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": \"unknown\",\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"4620-4639\"\n}\n```", "true_json": {"action": "Wait/Prepare for pouring", "subtask": "Prepare for pouring", "objects": ["coffee equipment", "small bottle", "white mug", "weighing scale"], "contact": "yes", "transition": "no", "next_action": "Wait/Prepare for pouring", "evidence_window": {"start_frame": 4620, "end_frame": 4639}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": "unknown", "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "4620-4639"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:232", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 4640, "end_frame": 4659, "num_frames": 20}, "true_label": "Wait/Prepare for pouring", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": \"unknown\",\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"4640-4659\"\n}\n```", "true_json": {"action": "Wait/Prepare for pouring", "subtask": "Prepare for pouring", "objects": ["coffee equipment", "small bottle", "white mug", "weighing scale"], "contact": "yes", "transition": "no", "next_action": "Wait/Prepare for pouring", "evidence_window": {"start_frame": 4640, "end_frame": 4659}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": "unknown", "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "4640-4659"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:233", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 4660, "end_frame": 4679, "num_frames": 20}, "true_label": "Wait/Prepare for pouring", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": \"unknown\",\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"4660-4679\"\n}\n```", "true_json": {"action": "Wait/Prepare for pouring", "subtask": "Prepare for pouring", "objects": ["coffee equipment", "small bottle", "white mug", "weighing scale"], "contact": "yes", "transition": "no", "next_action": "Wait/Prepare for pouring", "evidence_window": {"start_frame": 4660, "end_frame": 4679}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": "unknown", "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "4660-4679"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:250", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 5000, "end_frame": 5019, "num_frames": 20}, "true_label": "Pour coffee", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": \"unknown\",\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"5000-5019\"\n}\n```", "true_json": {"action": "Pour coffee", "subtask": "Pour coffee", "objects": ["carafe", "coffee mug", "scale"], "contact": "yes", "transition": "no", "next_action": "Pour coffee", "evidence_window": {"start_frame": 5000, "end_frame": 5019}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": "unknown", "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "5000-5019"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:251", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 5020, "end_frame": 5039, "num_frames": 20}, "true_label": "Pour coffee", "raw_prediction": "```json\n{\n \"action\": \"Wait/Prepare for pouring\",\n \"subtask\": \"Prepare for pouring\",\n \"objects\": [\n \"gooseneck kettle\"\n ],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"Pour coffee\",\n \"evidence_window\": \"5020-5039\"\n}\n```", "true_json": {"action": "Pour coffee", "subtask": "Pour coffee", "objects": ["carafe", "coffee mug", "scale"], "contact": "yes", "transition": "no", "next_action": "Pour coffee", "evidence_window": {"start_frame": 5020, "end_frame": 5039}}, "pred_json": {"action": "Wait/Prepare for pouring", "subtask": "Prepare for pouring", "objects": ["gooseneck kettle"], "contact": "unknown", "transition": "unknown", "next_action": "Pour coffee", "evidence_window": "5020-5039"}, "predicted_label": "Wait/Prepare for pouring", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:252", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 5040, "end_frame": 5059, "num_frames": 20}, "true_label": "Pour coffee", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": \"unknown\",\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"5040-5059\"\n}\n```", "true_json": {"action": "Pour coffee", "subtask": "Pour coffee", "objects": ["carafe", "coffee mug", "scale"], "contact": "yes", "transition": "no", "next_action": "Pour coffee", "evidence_window": {"start_frame": 5040, "end_frame": 5059}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": "unknown", "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "5040-5059"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:253", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 5060, "end_frame": 5079, "num_frames": 20}, "true_label": "Pour coffee", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": \"unknown\",\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"5060-5079\"\n}\n```", "true_json": {"action": "Pour coffee", "subtask": "Pour coffee", "objects": ["carafe", "coffee mug", "scale"], "contact": "yes", "transition": "no", "next_action": "Pour coffee", "evidence_window": {"start_frame": 5060, "end_frame": 5079}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": "unknown", "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "5060-5079"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:254", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 5080, "end_frame": 5099, "num_frames": 20}, "true_label": "Pour coffee", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": \"unknown\",\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"5080-5099\"\n}\n```", "true_json": {"action": "Pour coffee", "subtask": "Pour coffee", "objects": ["carafe", "coffee mug", "scale"], "contact": "yes", "transition": "no", "next_action": "Pour coffee", "evidence_window": {"start_frame": 5080, "end_frame": 5099}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": "unknown", "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "5080-5099"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:255", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 5100, "end_frame": 5119, "num_frames": 20}, "true_label": "Pour coffee", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": [],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"5100-5119\"\n}\n```", "true_json": {"action": "Pour coffee", "subtask": "Pour coffee", "objects": ["carafe", "coffee mug", "scale"], "contact": "yes", "transition": "no", "next_action": "Pour coffee", "evidence_window": {"start_frame": 5100, "end_frame": 5119}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": [], "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "5100-5119"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:256", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 5120, "end_frame": 5139, "num_frames": 20}, "true_label": "Pour coffee", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": [],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"5120-5139\"\n}\n```", "true_json": {"action": "Pour coffee", "subtask": "Pour coffee", "objects": ["carafe", "coffee mug", "scale"], "contact": "yes", "transition": "no", "next_action": "Pour coffee", "evidence_window": {"start_frame": 5120, "end_frame": 5139}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": [], "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "5120-5139"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:257", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 5140, "end_frame": 5159, "num_frames": 20}, "true_label": "Pour coffee", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": \"unknown\",\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"5140-5159\"\n}\n```", "true_json": {"action": "Pour coffee", "subtask": "Pour coffee", "objects": ["carafe", "coffee mug", "scale"], "contact": "yes", "transition": "no", "next_action": "Pour coffee", "evidence_window": {"start_frame": 5140, "end_frame": 5159}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": "unknown", "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "5140-5159"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
| {"id": "xperience-10m-sample:qa:290", "target": "episode_qa", "split": "train", "episode_id": "xperience-10m-sample", "center_window": {"start_frame": 5800, "end_frame": 5819, "num_frames": 20}, "true_label": "Pour milk into coffee", "raw_prediction": "```json\n{\n \"action\": \"unknown\",\n \"subtask\": \"unknown\",\n \"objects\": [\n \"unknown\"\n ],\n \"contact\": \"unknown\",\n \"transition\": \"unknown\",\n \"next_action\": \"unknown\",\n \"evidence_window\": \"5800-5819\"\n}\n```", "true_json": {"action": "Pour milk into coffee", "subtask": "Pour milk into coffee", "objects": ["coffee mug", "stainless steel milk pitcher", "table", "milk bottle", "digital scale"], "contact": "yes", "transition": "no", "next_action": "Pour milk into coffee", "evidence_window": {"start_frame": 5800, "end_frame": 5819}}, "pred_json": {"action": "unknown", "subtask": "unknown", "objects": ["unknown"], "contact": "unknown", "transition": "unknown", "next_action": "unknown", "evidence_window": "5800-5819"}, "predicted_label": "unknown", "correct": 0, "true_label_seen_in_train": 1} |
|
|