---
# Training configuration, restored to block-style YAML (one key per line,
# 2-space indentation). All keys and scalar values are unchanged.
#
# NOTE(review): this file was reconstructed from a copy whose line breaks and
# indentation had been lost. The section boundaries below follow the obvious
# key groupings; the two placements called out near the end of the file
# (`merge_lora`, `stage`) could not be determined from the text alone and
# should be confirmed against the code that loads this config.

model:
  name_or_path: Qwen/Qwen3.5-9B
  device_map: auto
  trust_remote_code: true
  attn_implementation: eager
  # 50176 = 224 * 224 and 200704 = 448 * 448.
  # NOTE(review): presumably per-image pixel budgets for the vision
  # preprocessor - confirm with the consumer.
  min_pixels: 50176
  max_pixels: 200704
  enable_thinking: false

training:
  bf16: true
  fp16: false
  gradient_checkpointing: true
  optim: adamw_bnb_8bit
  max_seq_length: 4096
  logging_steps: 10
  # save_steps and eval_steps are both 5000.
  save_steps: 5000
  save_total_limit: 1
  warmup_ratio: 0.03
  lr_scheduler: cosine
  report_to: wandb
  num_workers: 12
  resume_from_checkpoint: null
  output_dir: ./output/choonsik-stage3
  # NOTE(review): both num_epochs and max_steps are set; which one bounds the
  # run depends on the trainer consuming this file - confirm.
  num_epochs: 1
  max_steps: 118125
  batch_size: 32
  gradient_accumulation_steps: 1
  learning_rate: 5.0e-05
  eval_steps: 5000

data:
  name: CraftJarvis/minecraft-vla-sft
  streaming: false
  max_train_samples: null
  # NOTE(review): eval_split is null while max_eval_samples is 1000; how the
  # evaluation set is chosen in that case is not visible here - confirm.
  max_eval_samples: 1000
  eval_split: null

peft:
  enabled: true
  r: 64
  alpha: 128
  dropout: 0.05
  target_modules: all-linear

hub:
  enabled: true
  repo_id: Infinity08/Choonsik-Qwen3.5-9B
  private: false
  strategy: every_save
  # NOTE(review): assumed to belong to `hub` because it directly follows the
  # other hub keys; move to top level if the loader reads it from the root.
  merge_lora: true

# NOTE(review): assumed to be a top-level key (it matches the "stage3" suffix
# in training.output_dir); move under `hub` if the loader expects it there.
stage: 3