Robotics
ONNX
English
Chinese
real-world
dual-arm
whole body control
manipulation
zjt2656404169 commited on
Commit
73f7998
·
verified ·
1 Parent(s): 1113258

Upload 3 files

Browse files
G0_Plus_P&P_shadow/config.yaml ADDED
@@ -0,0 +1,229 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ TAG: debug
2
+ LOG_DIR: tensorboard_logs
3
+ seed: 7
4
+ vla_path: paligemma-3b-pt-224
5
+ data_root_dir: /galaxea_dataset/galaxea/pp_project/rlds_334_tasks_distributed/
6
+ dataset_name: bbox_training_r1_lite_8_parts
7
+ run_root_dir: runs/base
8
+ adapter_tmp_dir: adapter_tmp_weights
9
+ hf_token: /galaxea_fulltime/share/.hf_token
10
+ ckpt: /galaxea_fulltime/pretrained_ckpts/pi0_libero/pi0_torch_state.pt
11
+ use_lora: false
12
+ lora_rank: 32
13
+ lora_dropout: 0.0
14
+ use_quantization: false
15
+ enable_bf16: true
16
+ model_param_to_bf16: false
17
+ vla_training_strategy: vla-full-train
18
+ weight_decay: 1.0e-06
19
+ batch_size: 4
20
+ grad_accumulation_steps: 1
21
+ learning_rate: 2.5e-05
22
+ warmup_steps: 500
23
+ lr_scheduler_type: cosine
24
+ image_aug: true
25
+ max_epochs: 8
26
+ save_steps: 9106
27
+ log_steps: 100
28
+ use_torch_compile: false
29
+ wandb_project: 1101_pnp_rla_image_condition_419_tasks_8_parts
30
+ wandb_entity: cuijianning1996-galaxea-ai
31
+ exp_name: 376_tasks_img_as_cond_with_randomly_rotated_bbox_sub_sample_4
32
+ use_ema: false
33
+ ema:
34
+ update_after_step: 0
35
+ power: 0.67
36
+ DATASET:
37
+ robot_cfg:
38
+ with_left_arm: true
39
+ with_right_arm: true
40
+ with_torso: false
41
+ with_chassis: false
42
+ use_relative_joint_action: true
43
+ window_size: 1
44
+ future_action_window_size: 31
45
+ camera_views:
46
+ - head_condition
47
+ - head
48
+ - wrist_left
49
+ - wrist_right
50
+ shuffle_buffer_size: 10000
51
+ balance_weights: false
52
+ use_last_action: false
53
+ share_datasets_statistics: true
54
+ short_prompt: true
55
+ aug_instruction_kwargs:
56
+ drop_high_level_prob: 1.0
57
+ bbox_as_instruction: false
58
+ image_condition: true
59
+ image_condition_lang_prefix: Pick the object in the first image and place into
60
+ the tableware.
61
+ bbox_jitter_ratio: 0.0
62
+ action_proprio_normalization_type: normal
63
+ use_pretrained_data_stats: false
64
+ proprio_noise_std: 0.05
65
+ sample_step: 4
66
+ image_augment_kwargs:
67
+ head:
68
+ random_brightness:
69
+ - 0.2
70
+ random_contrast:
71
+ - 0.8
72
+ - 1.2
73
+ random_saturation:
74
+ - 0.8
75
+ - 1.2
76
+ random_hue:
77
+ - 0.05
78
+ augment_order:
79
+ - random_brightness
80
+ - random_contrast
81
+ - random_saturation
82
+ - random_hue
83
+ wrist_left:
84
+ random_brightness:
85
+ - 0.2
86
+ random_contrast:
87
+ - 0.8
88
+ - 1.2
89
+ random_saturation:
90
+ - 0.8
91
+ - 1.2
92
+ random_hue:
93
+ - 0.05
94
+ random_drop_all_image:
95
+ - 0.3
96
+ augment_order:
97
+ - random_drop_all_image
98
+ - random_brightness
99
+ - random_contrast
100
+ - random_saturation
101
+ - random_hue
102
+ wrist_right:
103
+ random_brightness:
104
+ - 0.2
105
+ random_contrast:
106
+ - 0.8
107
+ - 1.2
108
+ random_saturation:
109
+ - 0.8
110
+ - 1.2
111
+ random_hue:
112
+ - 0.05
113
+ random_drop_all_image:
114
+ - 0.3
115
+ augment_order:
116
+ - random_drop_all_image
117
+ - random_brightness
118
+ - random_contrast
119
+ - random_saturation
120
+ - random_hue
121
+ model_family: galaxea_zero
122
+ MODEL:
123
+ name: vla.galaxea_zero_allen.GalaxeaZero
124
+ vla_name: paligemma-3b-pt-224
125
+ load_inside: false
126
+ pretrained_model_path: /galaxea_fulltime/pretrained_ckpts/cache/paligemma-3b-pt-224
127
+ input_ids: true
128
+ action_expert_only: false
129
+ image_token_index: 257152
130
+ vocab_size: 257216
131
+ pad_token_id: 0
132
+ cond_steps: 1
133
+ horizon_steps: 32
134
+ action_dim: 14
135
+ proprio_dim: 14
136
+ max_text_tokens: 55
137
+ max_seq_len: 1079
138
+ max_image_text_tokens: 1079
139
+ action_decoder_layers: 2
140
+ flow_sampling: beta
141
+ num_inference_steps: 10
142
+ final_action_clip_value: null
143
+ action_expert_adaptive_mode: null
144
+ num_input_images: 4
145
+ predict_depth: false
146
+ vision:
147
+ use_lvsm: false
148
+ name: allen_model.paligemma.siglip.SiglipVisionModel
149
+ hidden_size: 1152
150
+ intermediate_size: 4304
151
+ num_hidden_layers: 27
152
+ num_attention_heads: 16
153
+ num_channels: 3
154
+ image_size: 224
155
+ patch_size: 14
156
+ layer_norm_eps: 1.0e-06
157
+ attention_dropout: 0.0
158
+ num_image_tokens: 256
159
+ lora:
160
+ r: 32
161
+ dropout: 0.0
162
+ use_quantize: false
163
+ use_lora: false
164
+ vision_projector:
165
+ name: allen_model.paligemma.siglip.PaliGemmaMultiModalProjector
166
+ vision_config:
167
+ hidden_size: 1152
168
+ projection_dim: 2048
169
+ lora:
170
+ r: 32
171
+ dropout: 0.0
172
+ use_quantize: false
173
+ use_lora: false
174
+ joint:
175
+ name: allen_model.vla.joint_model.JointModel
176
+ action_expert_adaptive_mode: null
177
+ mixture:
178
+ vlm:
179
+ hidden_size: 2048
180
+ intermediate_size: 16384
181
+ use_final_norm: false
182
+ cache: true
183
+ use_quantize: false
184
+ use_lora: false
185
+ adaptive_mode: null
186
+ proprio:
187
+ hidden_size: 1024
188
+ intermediate_size: 4096
189
+ use_final_norm: true
190
+ cache: true
191
+ use_quantize: false
192
+ use_lora: false
193
+ adaptive_mode: null
194
+ action:
195
+ hidden_size: 1024
196
+ intermediate_size: 4096
197
+ use_final_norm: true
198
+ cache: false
199
+ use_quantize: false
200
+ use_lora: false
201
+ adaptive_mode: null
202
+ time_hidden_size: 256
203
+ lora:
204
+ r: 32
205
+ dropout: 0.0
206
+ num_hidden_layers: 18
207
+ num_attention_heads: 8
208
+ num_key_value_heads: 1
209
+ head_dim: 256
210
+ max_position_embeddings: 8192
211
+ rms_norm_eps: 1.0e-06
212
+ rope_theta: 10000.0
213
+ attention_bias: false
214
+ attention_dropout: 0.0
215
+ pad_token_id: 0
216
+ EVALUATION:
217
+ checkpoint: null
218
+ load_in_8bit: false
219
+ load_in_4bit: false
220
+ center_crop: true
221
+ task_suite_name: simpler_widowx
222
+ num_steps_wait: 10
223
+ num_trials_per_task: 24
224
+ use_wrist_image: false
225
+ run_id_note: None
226
+ local_log_dir: ./experiments/logs
227
+ use_wandb: false
228
+ seed: 7
229
+ config: vla/config/allen/r1_lite/1101_image_condition_randomly_rotated_bbox_pi0_8parts_subsample4.yml
G0_Plus_P&P_shadow/dataset_statistics.json ADDED
The diff for this file is too large to render. See raw diff
 
G0_Plus_P&P_shadow/model_72847.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bb8bbb6082baaa336b8eec286b281e031f75390ee2dba4e46e971b572e2286b6
3
+ size 12957334084