Upload 3 files

Browse files

Files changed (3)

G0_Plus_P&P_shadow/config.yaml +229 -0
G0_Plus_P&P_shadow/dataset_statistics.json +0 -0
G0_Plus_P&P_shadow/model_72847.pt +3 -0

G0_Plus_P&P_shadow/config.yaml ADDED Viewed

	@@ -0,0 +1,229 @@

+TAG: debug
+LOG_DIR: tensorboard_logs
+seed: 7
+vla_path: paligemma-3b-pt-224
+data_root_dir: /galaxea_dataset/galaxea/pp_project/rlds_334_tasks_distributed/
+dataset_name: bbox_training_r1_lite_8_parts
+run_root_dir: runs/base
+adapter_tmp_dir: adapter_tmp_weights
+hf_token: /galaxea_fulltime/share/.hf_token
+ckpt: /galaxea_fulltime/pretrained_ckpts/pi0_libero/pi0_torch_state.pt
+use_lora: false
+lora_rank: 32
+lora_dropout: 0.0
+use_quantization: false
+enable_bf16: true
+model_param_to_bf16: false
+vla_training_strategy: vla-full-train
+weight_decay: 1.0e-06
+batch_size: 4
+grad_accumulation_steps: 1
+learning_rate: 2.5e-05
+warmup_steps: 500
+lr_scheduler_type: cosine
+image_aug: true
+max_epochs: 8
+save_steps: 9106
+log_steps: 100
+use_torch_compile: false
+wandb_project: 1101_pnp_rla_image_condition_419_tasks_8_parts
+wandb_entity: cuijianning1996-galaxea-ai
+exp_name: 376_tasks_img_as_cond_with_randomly_rotated_bbox_sub_sample_4
+use_ema: false
+ema:
+  update_after_step: 0
+  power: 0.67
+DATASET:
+  robot_cfg:
+    with_left_arm: true
+    with_right_arm: true
+    with_torso: false
+    with_chassis: false
+  use_relative_joint_action: true
+  window_size: 1
+  future_action_window_size: 31
+  camera_views:
+  - head_condition
+  - head
+  - wrist_left
+  - wrist_right
+  shuffle_buffer_size: 10000
+  balance_weights: false
+  use_last_action: false
+  share_datasets_statistics: true
+  short_prompt: true
+  aug_instruction_kwargs:
+    drop_high_level_prob: 1.0
+    bbox_as_instruction: false
+    image_condition: true
+    image_condition_lang_prefix: Pick the object in the first image and place into
+      the tableware.
+    bbox_jitter_ratio: 0.0
+  action_proprio_normalization_type: normal
+  use_pretrained_data_stats: false
+  proprio_noise_std: 0.05
+  sample_step: 4
+  image_augment_kwargs:
+    head:
+      random_brightness:
+      - 0.2
+      random_contrast:
+      - 0.8
+      - 1.2
+      random_saturation:
+      - 0.8
+      - 1.2
+      random_hue:
+      - 0.05
+      augment_order:
+      - random_brightness
+      - random_contrast
+      - random_saturation
+      - random_hue
+    wrist_left:
+      random_brightness:
+      - 0.2
+      random_contrast:
+      - 0.8
+      - 1.2
+      random_saturation:
+      - 0.8
+      - 1.2
+      random_hue:
+      - 0.05
+      random_drop_all_image:
+      - 0.3
+      augment_order:
+      - random_drop_all_image
+      - random_brightness
+      - random_contrast
+      - random_saturation
+      - random_hue
+    wrist_right:
+      random_brightness:
+      - 0.2
+      random_contrast:
+      - 0.8
+      - 1.2
+      random_saturation:
+      - 0.8
+      - 1.2
+      random_hue:
+      - 0.05
+      random_drop_all_image:
+      - 0.3
+      augment_order:
+      - random_drop_all_image
+      - random_brightness
+      - random_contrast
+      - random_saturation
+      - random_hue
+model_family: galaxea_zero
+MODEL:
+  name: vla.galaxea_zero_allen.GalaxeaZero
+  vla_name: paligemma-3b-pt-224
+  load_inside: false
+  pretrained_model_path: /galaxea_fulltime/pretrained_ckpts/cache/paligemma-3b-pt-224
+  input_ids: true
+  action_expert_only: false
+  image_token_index: 257152
+  vocab_size: 257216
+  pad_token_id: 0
+  cond_steps: 1
+  horizon_steps: 32
+  action_dim: 14
+  proprio_dim: 14
+  max_text_tokens: 55
+  max_seq_len: 1079
+  max_image_text_tokens: 1079
+  action_decoder_layers: 2
+  flow_sampling: beta
+  num_inference_steps: 10
+  final_action_clip_value: null
+  action_expert_adaptive_mode: null
+  num_input_images: 4
+  predict_depth: false
+  vision:
+    use_lvsm: false
+    name: allen_model.paligemma.siglip.SiglipVisionModel
+    hidden_size: 1152
+    intermediate_size: 4304
+    num_hidden_layers: 27
+    num_attention_heads: 16
+    num_channels: 3
+    image_size: 224
+    patch_size: 14
+    layer_norm_eps: 1.0e-06
+    attention_dropout: 0.0
+    num_image_tokens: 256
+    lora:
+      r: 32
+      dropout: 0.0
+    use_quantize: false
+    use_lora: false
+  vision_projector:
+    name: allen_model.paligemma.siglip.PaliGemmaMultiModalProjector
+    vision_config:
+      hidden_size: 1152
+      projection_dim: 2048
+    lora:
+      r: 32
+      dropout: 0.0
+    use_quantize: false
+    use_lora: false
+  joint:
+    name: allen_model.vla.joint_model.JointModel
+    action_expert_adaptive_mode: null
+    mixture:
+      vlm:
+        hidden_size: 2048
+        intermediate_size: 16384
+        use_final_norm: false
+        cache: true
+        use_quantize: false
+        use_lora: false
+        adaptive_mode: null
+      proprio:
+        hidden_size: 1024
+        intermediate_size: 4096
+        use_final_norm: true
+        cache: true
+        use_quantize: false
+        use_lora: false
+        adaptive_mode: null
+      action:
+        hidden_size: 1024
+        intermediate_size: 4096
+        use_final_norm: true
+        cache: false
+        use_quantize: false
+        use_lora: false
+        adaptive_mode: null
+    time_hidden_size: 256
+    lora:
+      r: 32
+      dropout: 0.0
+    num_hidden_layers: 18
+    num_attention_heads: 8
+    num_key_value_heads: 1
+    head_dim: 256
+    max_position_embeddings: 8192
+    rms_norm_eps: 1.0e-06
+    rope_theta: 10000.0
+    attention_bias: false
+    attention_dropout: 0.0
+    pad_token_id: 0
+EVALUATION:
+  checkpoint: null
+  load_in_8bit: false
+  load_in_4bit: false
+  center_crop: true
+  task_suite_name: simpler_widowx
+  num_steps_wait: 10
+  num_trials_per_task: 24
+  use_wrist_image: false
+  run_id_note: None
+  local_log_dir: ./experiments/logs
+  use_wandb: false
+  seed: 7
+config: vla/config/allen/r1_lite/1101_image_condition_randomly_rotated_bbox_pi0_8parts_subsample4.yml

G0_Plus_P&P_shadow/dataset_statistics.json ADDED Viewed

The diff for this file is too large to render. See raw diff

G0_Plus_P&P_shadow/model_72847.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:bb8bbb6082baaa336b8eec286b281e031f75390ee2dba4e46e971b572e2286b6
+size 12957334084