---
# Training configuration for run 0421-NeuroVLA-All4Suite-bs16-sdpa.
#
# NOTE(review): the block nesting below was reconstructed from a copy whose
# whitespace had been collapsed onto single lines. Keys, values and their
# order are unchanged; placements that could not be determined with certainty
# are marked with their own NOTE(review) comments — confirm against the
# consuming code.

framework:
  name: NeuroVLA
  qwenvl:
    attn_implementation: sdpa
    vl_hidden_dim: 2048
    base_vlm: /share/lipengteng/VLA-Engine-Developer/data/pretrained_models/Qwen2.5-VL-3B-Instruct
  layer_qformer:
    qformer_end_layer: 37
    qformer_start_layer: 36
    num_query_tokens: 8
    # Same value as qwenvl.vl_hidden_dim above.
    input_dim: 2048
    # NOTE(review): key is spelled "ouptput_dim" (sic). Left unchanged because
    # the consuming code may look it up by this exact name — confirm before
    # renaming.
    ouptput_dim: 768
    grad_scale: 0.5
  action_model:
    hidden_size: 1024
    add_pos_embed: true
    max_seq_len: 1024
    action_dim: 7
    state_dim: 7
    future_action_window_size: 15
    action_horizon: 16
    past_action_window_size: 0
    repeated_diffusion_steps: 8
  # NOTE(review): assumed to be a framework-level key rather than part of
  # action_model — confirm.
  reduce_in_full_precision: true

trainer:
  enable_gradient_checkpointing: true
  enable_mixed_precision_training: true
  epochs: 100
  # NOTE(review): larger than max_train_steps (50000); presumably this keeps
  # periodic evaluation from triggering — confirm that is intended.
  eval_interval: 50001
  freeze_modules: ''
  gradient_accumulation_steps: 1
  gradient_clipping: 1.0
  is_resume: false
  learning_rate:
    action_model: 0.0001
    base: 2.5e-05
    qwen_vl_interface: 1.0e-05
    layer_qformer: 5.0e-05
  logging_frequency: 10
  loss_scale:
    vla: 1.0
    vlm: 0.1
  lr_scheduler_type: cosine_with_min_lr
  max_grad_norm: 1.0
  max_train_steps: 50000
  num_warmup_steps: 5000
  optimizer:
    betas:
      - 0.9
      - 0.95
    eps: 1.0e-08
    name: AdamW
    weight_decay: 1.0e-08
  resume_epoch: null
  resume_step: null
  save_interval: 10000
  scheduler_specific_kwargs:
    min_lr: 1.0e-06
  # NOTE(review): warmup_ratio and weight_decay are assumed to be trainer-level
  # keys (they continue the alphabetical key order of this section) rather
  # than scheduler kwargs — confirm.
  warmup_ratio: 0.1
  weight_decay: 0.0

environment:
  wandb_mode: online
  wandb_project: vla-engine-benchmark
  wandb_entity: ''
  wandb_base_url: https://api.bandw.top
  num_gpus: 2
  main_process_port: 29500
  nccl:
    ib_hca: mlx5_2,mlx5_3
    blocking_wait: 1
    async_error_handling: 1
    # NOTE(review): timeout and socket_timeout_ms are assumed to belong to the
    # nccl group; their units are not stated here — confirm.
    timeout: 10000
    socket_timeout_ms: 360000

# NOTE(review): seed, run_id and output_root_dir are assumed to be top-level
# keys (not part of environment) — confirm.
seed: 42
# Quoted so the leading digits can never be mistaken for a number.
run_id: '0421-NeuroVLA-All4Suite-bs16-sdpa'
output_root_dir: ./results/training

datasets:
  vla_data:
    data_root_dir: /share/weiyu/IPEC-COMMUNITY
    dataset_mix: libero_all
    per_device_batch_size: 16
    dataloader_module: lerobot_datasets
    action_type: delta_ee
    sequential_step_sampling: false
    # Folded scalar: the lines below are joined with single spaces into one
    # line, with no trailing newline. "{instruction}" is kept verbatim.
    CoT_prompt: >-
      Your task is {instruction}. To identify the key objects for your task.
      Locate their bounding boxes in [x1,y1,x2,y2] format.
    CoT_answer: bbox
    default_image_resolution:
      - 3
      - 224
      - 224
    load_all_data_for_training: true
    obs:
      - image_0
    video_backend: torchvision_av
    include_state: true

# Matches output_root_dir joined with run_id.
output_dir: ./results/training/0421-NeuroVLA-All4Suite-bs16-sdpa