{ "type": "eo1", "n_obs_steps": 1, "input_features": { "observation.images.image": { "type": "VISUAL", "shape": [ 3, 256, 256 ] }, "observation.images.wrist_image": { "type": "VISUAL", "shape": [ 3, 256, 256 ] }, "observation.state": { "type": "STATE", "shape": [ 8 ] }, "observation.state.joint": { "type": "STATE", "shape": [ 7 ] } }, "output_features": { "action": { "type": "ACTION", "shape": [ 7 ] } }, "device": "cuda", "use_amp": false, "use_peft": false, "push_to_hub": true, "repo_id": "crislmfroes/eo1-libero-10-task-0", "private": null, "tags": null, "license": null, "pretrained_path": null, "vlm_base": "Qwen/Qwen3.5-0.8B", "vlm_config": { "transformers_version": "5.5.4", "architectures": [ "Qwen3_5ForConditionalGeneration" ], "output_hidden_states": false, "return_dict": true, "dtype": null, "chunk_size_feed_forward": 0, "is_encoder_decoder": false, "id2label": { "0": "LABEL_0", "1": "LABEL_1" }, "label2id": { "LABEL_0": 0, "LABEL_1": 1 }, "problem_type": null, "text_config": { "architectures": null, "output_hidden_states": false, "return_dict": true, "dtype": "bfloat16", "chunk_size_feed_forward": 0, "is_encoder_decoder": false, "id2label": { "0": "LABEL_0", "1": "LABEL_1" }, "label2id": { "LABEL_0": 0, "LABEL_1": 1 }, "problem_type": null, "vocab_size": 248320, "hidden_size": 1024, "intermediate_size": 3584, "num_hidden_layers": 24, "num_attention_heads": 8, "num_key_value_heads": 2, "hidden_act": "silu", "max_position_embeddings": 262144, "initializer_range": 0.02, "rms_norm_eps": 1e-06, "use_cache": true, "use_sliding_window": false, "sliding_window": null, "max_window_layers": 80, "layer_types": [ "linear_attention", "linear_attention", "linear_attention", "full_attention", "linear_attention", "linear_attention", "linear_attention", "full_attention", "linear_attention", "linear_attention", "linear_attention", "full_attention", "linear_attention", "linear_attention", "linear_attention", "full_attention", "linear_attention", "linear_attention", "linear_attention", "full_attention", "linear_attention", "linear_attention", "linear_attention", "full_attention" ], "attention_dropout": 0.0, "rope_parameters": { "mrope_interleaved": true, "mrope_section": [ 11, 11, 10 ], "rope_type": "default", "rope_theta": 10000000, "partial_rotary_factor": 0.25 }, "bos_token_id": 151643, "eos_token_id": 248044, "pad_token_id": null, "_name_or_path": "", "attention_bias": false, "attn_output_gate": true, "full_attention_interval": 4, "head_dim": 256, "linear_conv_kernel_dim": 4, "linear_key_head_dim": 128, "linear_num_key_heads": 16, "linear_num_value_heads": 16, "linear_value_head_dim": 128, "mlp_only_layers": [], "model_type": "qwen2_5_vl_text", "mtp_num_hidden_layers": 1, "mtp_use_dedicated_embeddings": false, "tie_word_embeddings": true, "mamba_ssm_dtype": "float32", "output_attentions": false }, "vision_config": { "architectures": null, "output_hidden_states": false, "return_dict": true, "dtype": null, "chunk_size_feed_forward": 0, "is_encoder_decoder": false, "id2label": { "0": "LABEL_0", "1": "LABEL_1" }, "label2id": { "LABEL_0": 0, "LABEL_1": 1 }, "problem_type": null, "depth": 12, "hidden_size": 768, "hidden_act": "gelu_pytorch_tanh", "intermediate_size": 3072, "num_heads": 12, "in_channels": 3, "patch_size": 16, "spatial_merge_size": 2, "temporal_patch_size": 2, "tokens_per_second": 4, "window_size": 112, "out_hidden_size": 1024, "fullatt_block_indexes": [ 7, 15, 23, 31 ], "initializer_range": 0.02, "_name_or_path": "", "deepstack_visual_indexes": [], "model_type": "qwen2_5_vl", "num_position_embeddings": 2304, "output_attentions": false }, "image_token_id": 248056, "video_token_id": 248057, "vision_start_token_id": 248053, "vision_end_token_id": 248054, "tie_word_embeddings": true, "_name_or_path": "", "model_type": "qwen2_5_vl", "output_attentions": false }, "image_min_pixels": 50176, "image_max_pixels": 100352, "use_fast_processor": true, "chunk_size": 8, "n_action_steps": 8, "max_state_dim": 32, "max_action_dim": 32, "num_denoise_steps": 10, "num_action_layers": 2, "action_act": "linear", "time_sampling_beta_alpha": 1.5, "time_sampling_beta_beta": 1.0, "time_sampling_scale": 0.999, "time_sampling_offset": 0.001, "min_period": 0.004, "max_period": 4.0, "supervise_padding_action_dims": true, "supervise_padding_actions": true, "dtype": "bfloat16", "force_fp32_autocast": true, "attn_implementation": null, "gradient_checkpointing": true, "normalization_mapping": { "VISUAL": "IDENTITY", "STATE": "MEAN_STD", "ACTION": "MEAN_STD" }, "optimizer_lr": 0.0001, "optimizer_betas": [ 0.9, 0.999 ], "optimizer_eps": 1e-08, "optimizer_weight_decay": 0.1, "optimizer_grad_clip_norm": 1.0, "scheduler_warmup_steps": 900, "scheduler_decay_steps": 30000, "scheduler_decay_lr": 0.0 }