---
# Data section: dataset source, camera/joint selection, normalization
# statistics, and loader settings.
data:
  # Names of the camera streams used (three entries).
  cameras:
    - camera_top
    - camera_wrist_left
    - camera_wrist_right
  chat_template: default
  data_name: robotwin
  data_type: conversation
  dataloader_type: native
  datasets_type: vla
  drop_last: true
  img_size: 224
  # NOTE(review): each entry is a single-quoted string containing a
  # dict-like literal, not a YAML mapping. Presumably the consumer parses
  # these strings itself -- confirm before converting to real mappings.
  joints:
    - '{''arm.position'': 14}'
    - '{''effector.position'': 2}'
  max_seq_len: 2048
  norm_stats_file: assets/norm_stats/robotwin_50.json
  norm_type: bounds_99
  # Loader settings.
  num_workers: 8
  pin_memory: true
  prefetch_factor: 4
  robot_config_root: configs/robot_configs
  text_keys: messages
  # Relative path; presumably resolved against the working directory of the
  # training process -- confirm.
  train_path: ./assets/training_data/robotwin_all_tasks_with_aug.txt
  train_size: 8000000
# Model section: architecture switches and optional component paths.
model:
  adanorm_time: true
  attn_implementation: flash_attention_2
  # Empty collections are written explicitly so they do not parse as null.
  basic_modules: []
  decoders: {}
  encoders: {}
  final_norm_adanorm: false
  force_use_huggingface: false
  # Optional paths are left unset in this configuration.
  moge_path: null
  morgbd_path: null
  nosplit_gate_liner: false
  post_training: true
  separate_time_proj: false
  split_gate_liner: false
  use_lm_head: false
  # NOTE(review): vlm_repo_id is null and vocab_size is 0 here; presumably
  # both are filled in or overridden at launch time -- confirm.
  vlm_repo_id: null
  vocab_size: 0
# Train section: parallelism layout, batch sizing, optimizer/schedule,
# checkpointing, profiling, and logging settings.
train:
  action_dim: null
  activation_gpu_limit: 0.0
  adapt_to_pi_aloha: false
  align_params: {}
  bsz_warmup_init_mbtoken: 200
  bsz_warmup_ratio: 0
  chunk_size: 50
  ckpt_manager: dcp
  context_parallel_size: 1
  data_parallel_mode: fsdp2
  data_parallel_replicate_size: 1
  data_parallel_shard_size: 8
  decayed_max_grad_norm: 1.0
  dyn_bsz: true
  dyn_bsz_buffer_size: 200
  dyn_bsz_margin: 0
  empty_cache_steps: 500
  enable_activation_offload: false
  enable_expert_vision: false
  enable_forward_prefetch: true
  # NOTE(review): enable_fp32 and enable_mixed_precision are both true; how
  # the two flags interact is not visible in this file -- confirm.
  enable_fp32: true
  enable_fsdp_offload: false
  enable_full_determinism: false
  enable_full_shard: false
  enable_gradient_checkpointing: true
  enable_mixed_precision: true
  enable_profiling: false
  enable_reentrant: false
  enable_resume: true
  expert_parallel_size: 1
  expert_vision_path: null
  expert_vision_type: null
  freeze_vision_encoder: false
  freeze_vit: false
  # 256 equals micro_batch_size (32) * data_parallel_shard_size (8);
  # presumably this means no gradient accumulation -- confirm.
  global_batch_size: 256
  init_device: cuda
  load_checkpoint_path: null
  loss_type: L1_fm
  lr: 0.0001
  lr_decay_ratio: 1.0
  lr_decay_style: constant
  lr_min: 1.0e-07
  lr_start: 0.0
  lr_warmup_ratio: 0
  max_action_dim: 75
  max_grad_norm: 1.0
  max_state_dim: 75
  # NOTE(review): both max_steps and num_train_epochs are set; which limit
  # takes precedence is not visible in this file -- confirm.
  max_steps: 220000
  micro_batch_size: 32
  module_fsdp_enable: true
  norm_qkv: false
  num_steps: 10
  num_train_epochs: 69
  optimizer: adamw
  pipeline_parallel_size: 1
  # enable_profiling is false above, so the profile_* values below are
  # presumably unused in this run -- confirm.
  profile_end_step: 2
  profile_profile_memory: true
  profile_record_shapes: true
  profile_start_step: 1
  profile_trace_dir: ./trace
  profile_with_stack: true
  # Two-element size; matches data.img_size (224) in this configuration.
  resize_imgs_with_padding:
    - 224
    - 224
  resume_dataloader_state: true
  rmpad: false
  rmpad_with_pos_ids: false
  save_epochs: 23
  save_hf_weights: true
  save_steps: 10000
  seed: 42
  stable_train_steps: 100000
  tensor_parallel_size: 1
  tokenizer_max_length: 72
  train_expert_only: false
  train_state_proj: true
  ulysses_parallel_size: 1
  use_cache: true
  use_compile: true
  use_delta_joint_actions_aloha: false
  # use_wandb is false, so wandb_name / wandb_project are presumably
  # ignored in this run -- confirm.
  use_wandb: false
  vit_lr: 1.0e-06
  vlm_causal: false
  wandb_name: null
  wandb_project: LingBotVLA
  weight_decay: 0