# Choonsik-Qwen3.5-9B / choonsik_config.yaml
# Uploaded by Infinity08 in commit db8a08f ("Training in progress, step 5000").
# File size as reported by the hosting page: 988 bytes.
# Base model and how it is loaded.
# The settings are nested under `model` with a 2-space indent; written at
# column 0 they would be separate top-level keys and `model` would be null.
model:
  name_or_path: Qwen/Qwen3.5-9B
  device_map: auto
  # NOTE(review): if this flag is forwarded to a Hugging Face `from_pretrained`
  # call it permits running code shipped in the model repository -- keep it
  # enabled only for repositories you trust.
  trust_remote_code: true
  attn_implementation: eager
  # 50176 = 224 * 224 and 200704 = 448 * 448; presumably per-image pixel
  # bounds for the vision processor -- confirm against the loader.
  min_pixels: 50176
  max_pixels: 200704
  enable_thinking: false
# Optimisation, checkpointing, and logging settings.
# The settings are nested under `training` with a 2-space indent; written at
# column 0 they would be separate top-level keys and `training` would be null.
training:
  # Precision: bf16 on, fp16 off.
  bf16: true
  fp16: false
  gradient_checkpointing: true
  optim: adamw_bnb_8bit
  max_seq_length: 4096

  # Logging and checkpoint cadence (in steps). Only one checkpoint is retained.
  logging_steps: 10
  save_steps: 5000
  save_total_limit: 1

  # Learning-rate schedule.
  warmup_ratio: 0.03
  lr_scheduler: cosine
  learning_rate: 5.0e-05

  report_to: wandb
  num_workers: 12
  resume_from_checkpoint: null
  output_dir: ./output/choonsik-stage3

  # NOTE(review): both `num_epochs` and `max_steps` are set -- confirm which
  # one the training script treats as the stopping condition.
  num_epochs: 1
  max_steps: 118125
  batch_size: 32
  gradient_accumulation_steps: 1

  # Same cadence as `save_steps`.
  # NOTE(review): `data.eval_split` is null in this file -- confirm that
  # evaluation actually runs with this setting.
  eval_steps: 5000
# Dataset selection and sample limits.
# The settings are nested under `data` with a 2-space indent; written at
# column 0 they would be separate top-level keys and `data` would be null.
data:
  name: CraftJarvis/minecraft-vla-sft
  streaming: false
  # null here presumably means "no cap on training samples" -- confirm.
  max_train_samples: null
  max_eval_samples: 1000
  # NOTE(review): no evaluation split is named even though `max_eval_samples`
  # and `training.eval_steps` are set -- confirm how the eval set is obtained.
  eval_split: null
# Parameter-efficient fine-tuning (adapter) settings.
# The settings are nested under `peft` with a 2-space indent. Nesting also
# keeps this `enabled` flag distinct from the one in the `hub` section; at
# column 0 the two would be duplicate top-level keys.
peft:
  enabled: true
  # alpha is 2 * r (128 = 2 * 64).
  r: 64
  alpha: 128
  dropout: 0.05
  target_modules: all-linear
# Model-hub upload settings.
# The settings are nested under `hub` with a 2-space indent. Nesting also
# keeps this `enabled` flag distinct from the one in the `peft` section; at
# column 0 the two would be duplicate top-level keys.
hub:
  enabled: true
  repo_id: Infinity08/Choonsik-Qwen3.5-9B
  # The target repository is public.
  private: false
  # Presumably uploads at every checkpoint save (see `training.save_steps`)
  # -- confirm against the training script.
  strategy: every_save
  merge_lora: true
# Top-level setting (column 0), not a member of any section.
# Presumably the training-stage index; it matches the `stage3` suffix in
# `output_dir` -- confirm against the training script.
stage: 3