# File size: 988 Bytes
# db8a08f
# Base-model selection and loading options.
model:
  # Model identifier in "<namespace>/<name>" form.
  name_or_path: Qwen/Qwen3.5-9B
  device_map: auto
  # NOTE(review): presumably forwarded to the model loader, which would let
  # code shipped with the model repository run locally — confirm the source
  # is trusted.
  trust_remote_code: true
  # NOTE(review): presumably selects the plain (non-fused) attention path —
  # confirm this is intentional.
  attn_implementation: eager
  # 50176 = 224 * 224 and 200704 = 448 * 448.
  # Presumably lower/upper bounds on image size in total pixels — TODO confirm
  # the unit against the code that reads these keys.
  min_pixels: 50176
  max_pixels: 200704
  enable_thinking: false
# Optimisation, logging, checkpointing and schedule settings for the run.
training:
  # Precision flags: bf16 is on and fp16 is off.
  bf16: true
  fp16: false
  gradient_checkpointing: true
  optim: adamw_bnb_8bit
  max_seq_length: 4096
  logging_steps: 10
  # save_steps and eval_steps (below) share the same value, 5000.
  save_steps: 5000
  save_total_limit: 1
  warmup_ratio: 0.03
  lr_scheduler: cosine
  report_to: wandb
  num_workers: 12
  # null: no checkpoint path is given here.
  resume_from_checkpoint: null
  output_dir: ./output/choonsik-stage3
  # NOTE(review): num_epochs and max_steps are both set. Which one bounds the
  # run depends on the trainer reading this file — presumably max_steps takes
  # precedence; confirm.
  num_epochs: 1
  max_steps: 118125
  # batch_size * gradient_accumulation_steps = 32 * 1 = 32.
  # NOTE(review): whether batch_size is per device or global is not visible
  # here — confirm.
  batch_size: 32
  gradient_accumulation_steps: 1
  learning_rate: 5.0e-05
  eval_steps: 5000
# Dataset selection and sample limits.
data:
  # Dataset identifier in "<namespace>/<name>" form.
  name: CraftJarvis/minecraft-vla-sft
  streaming: false
  # null: no training-sample limit is specified here.
  max_train_samples: null
  max_eval_samples: 1000
  # NOTE(review): eval_split is null while max_eval_samples and
  # training.eval_steps are set. How the evaluation set is obtained is decided
  # by the loader — confirm evaluation actually runs.
  eval_split: null
# Parameter-efficient fine-tuning settings.
# NOTE(review): presumably LoRA, given hub.merge_lora elsewhere in this file —
# confirm.
peft:
  enabled: true
  # alpha / r = 128 / 64 = 2.
  r: 64
  alpha: 128
  dropout: 0.05
  target_modules: all-linear
# Settings for publishing results to a remote model repository.
hub:
  enabled: true
  # Target repository in "<namespace>/<name>" form.
  repo_id: Infinity08/Choonsik-Qwen3.5-9B
  # NOTE(review): private is false, so the repository is presumably publicly
  # visible — confirm that is intended.
  private: false
  # NOTE(review): presumably uploads on every checkpoint save (see
  # training.save_steps) — confirm.
  strategy: every_save
  merge_lora: true
# Stage number for this configuration; it matches the "stage3" suffix of
# training.output_dir.
stage: 3