{
  "id": "qwen3_omni_lora",
  "display_name": "Qwen3-Omni LoRA",
  "status": "implemented",
  "model_family": "Qwen3-Omni",
  "default_model_id": "Qwen/Qwen3-Omni-30B-A3B-Instruct",
  "local_model_env": "MODEL_DIR",
  "dataset_contract": "xperience10m_episode_json_qa_v1",
  "training_objective": "structured_episode_understanding_json_qa",
  "split_policy": {
    "unit": "episode",
    "default_counts": {
      "train": 96,
      "val": 16,
      "test": 16
    },
    "leakage_guard": "episode_id and path-qualified session split checks"
  },
  "modalities": {
    "direct_inputs": [
      "multi-camera rendered mosaic video",
      "AAC audio extracted from fisheye_cam0 MP4",
      "language prompt and label options"
    ],
    "bridged_inputs": [
      "depth and confidence",
      "pose and SLAM trajectory",
      "body and hand mocap",
      "IMU acceleration and gyro",
      "object/contact summary features"
    ],
    "excluded_inputs": [
      "visualization.rrd"
    ]
  },
  "entrypoints": {
    "selection_manifest": "scripts/omni/build_selection_episode_manifest.py",
    "export": "scripts/omni/parallel_export_qwen3_omni_action_dataset.py",
    "neutral_index": "scripts/omni/export_model_neutral_window_index.py",
    "train": "scripts/omni/train_qwen3_omni_lora.py",
    "eval": "scripts/omni/eval_qwen3_omni_lora.py",
    "watch": "scripts/omni/watch_omni_train_then_eval.py",
    "launcher": "scripts/omni/run_128_fullsplit_parallel_export_8gpu.sh",
    "upload": "scripts/omni/upload_qwen3_omni_lora_to_hf.py",
    "validate": "scripts/omni/validate_omni_finetune_run.py"
  },
  "primary_metrics": [
    "json_validity_rate",
    "action_macro_f1",
    "subtask_accuracy",
    "transition_accuracy",
    "next_action_accuracy",
    "contact_accuracy",
    "object_micro_f1",
    "held_out_episode_count"
  ],
  "artifact_contract": {
    "checkpoint_gate": "lora_safetensors_shape_check",
    "required_eval_files": [
      "metrics.json",
      "predictions.jsonl",
      "predictions.csv",
      "per_class_metrics.csv",
      "confusion_matrix.csv",
      "RUN_REPORT.md"
    ],
    "required_training_files": [
      "training_metadata.json",
      "progress.jsonl",
      "adapter_config.json",
      "adapter_model.safetensors"
    ],
    "public_package_allowed": [
      "metrics",
      "predictions",
      "confusion matrices",
      "run reports",
      "episode and dataset manifests",
      "training metadata",
      "validation summaries"
    ],
    "public_package_forbidden": [
      "raw MP4",
      "annotation HDF5",
      "Rerun RRD",
      "base-model weights",
      "LoRA adapter weights",
      "full checkpoints",
      "large archives"
    ]
  },
  "extension_requirements": []
}