File size: 3,056 Bytes
3fa16b3
 
 
 
 
 
aef7426
3fa16b3
 
 
 
aef7426
3fa16b3
 
 
aef7426
 
 
 
3fa16b3
 
aef7426
3fa16b3
 
 
 
 
 
 
 
 
 
 
aef7426
 
3fa16b3
aef7426
3fa16b3
 
 
 
 
 
aef7426
3fa16b3
aef7426
3fa16b3
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1ebde43
3fa16b3
 
 
 
 
 
 
 
 
 
 
 
 
aef7426
 
3fa16b3
 
 
 
 
 
 
 
aef7426
 
 
3fa16b3
 
 
aef7426
3fa16b3
 
 
 
 
aef7426
 
 
3fa16b3
aef7426
3fa16b3
aef7426
3fa16b3
 
 
aef7426
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
# Dataset and dataloader section of this run configuration.
# Keys in this section are in alphabetical order, which suggests a
# machine-generated dump (assumption); the code that reads them is not part
# of this file, so per-key meanings below are hedged.
data:
  # Three camera identifiers; presumably the image streams read for each
  # sample -- confirm against the dataset loader.
  cameras:
  - camera_top
  - camera_wrist_left
  - camera_wrist_right
  chat_template: default
  data_name: robotwin
  data_type: conversation
  dataloader_type: native
  datasets_type: vla
  # drop_last, num_workers, pin_memory and prefetch_factor share their names
  # with torch.utils.data.DataLoader arguments; presumably forwarded to it --
  # confirm.
  drop_last: true
  # Same value as both entries of train.resize_imgs_with_padding (224, 224).
  # NOTE(review): whether the two settings must agree is not visible here.
  img_size: 224
  # NOTE(review): each entry is a single-quoted YAML *string* ('' is the
  # escape for one single quote), so a loader returns the text
  # {'arm.position': 14} and {'effector.position': 2}, not mappings.
  # Confirm the consumer expects strings before rewriting these as YAML
  # mappings; the values 14 and 2 are presumably per-group joint dimensions.
  joints:
  - '{''arm.position'': 14}'
  - '{''effector.position'': 2}'
  max_seq_len: 2048
  # Relative path; presumably resolved against the working directory of the
  # training process -- confirm. The same applies to robot_config_root and
  # train_path below.
  norm_stats_file: assets/norm_stats/robotwin_50.json
  norm_type: bounds_99
  num_workers: 8
  pin_memory: true
  prefetch_factor: 4
  robot_config_root: configs/robot_configs
  text_keys: messages
  # A .txt path; presumably a list of dataset locations rather than the data
  # itself -- confirm.
  train_path: ./assets/training_data/robotwin_all_tasks_with_aug.txt
  # Presumably a sample count -- TODO confirm the unit.
  train_size: 8000000
# Model section of this run configuration.
# Most entries are null, empty or false. No model or tokenizer path key is
# present in this section; whether one is required is not visible here.
model:
  adanorm_time: true
  # Value matches the Hugging Face Transformers `attn_implementation` option
  # name; presumably forwarded to it and requires the flash-attn package --
  # confirm.
  attn_implementation: flash_attention_2
  # Explicit empty list / empty mappings (not null).
  basic_modules: []
  decoders: {}
  encoders: {}
  final_norm_adanorm: false
  force_use_huggingface: false
  # Both optional paths are unset.
  moge_path: null
  morgbd_path: null
  # NOTE(review): "liner" in this key and in split_gate_liner looks like a
  # misspelling of "linear". The key text is what the consumer reads, so do
  # not rename it here without changing the reader as well.
  nosplit_gate_liner: false
  post_training: true
  separate_time_proj: false
  split_gate_liner: false
  use_lm_head: false
  vlm_repo_id: null
  # NOTE(review): 0 is presumably a placeholder filled in at load time --
  # confirm.
  vocab_size: 0
# Training section of this run configuration.
# Keys are in alphabetical order, so related settings (learning rate,
# parallelism, profiling, checkpointing) are spread through the section.
# The code that reads these keys is not part of this file; notes on how keys
# interact are hedged accordingly.
train:
  # Unset here, while max_action_dim and max_state_dim below are both 75.
  action_dim: null
  activation_gpu_limit: 0.0
  adapt_to_pi_aloha: false
  align_params: {}
  bsz_warmup_init_mbtoken: 200
  # Written as integer 0 (as are dyn_bsz_margin, lr_warmup_ratio and
  # weight_decay), so a YAML loader yields an int rather than a float.
  bsz_warmup_ratio: 0
  chunk_size: 50
  ckpt_manager: dcp
  # Parallelism: every *_parallel_size in this section is 1; the only
  # non-trivial dimension is data_parallel_shard_size: 8 under
  # data_parallel_mode: fsdp2.
  context_parallel_size: 1
  data_parallel_mode: fsdp2
  data_parallel_replicate_size: 1
  data_parallel_shard_size: 8
  # Same value as max_grad_norm (1.0).
  decayed_max_grad_norm: 1.0
  dyn_bsz: true
  dyn_bsz_buffer_size: 200
  dyn_bsz_margin: 0
  empty_cache_steps: 500
  enable_activation_offload: false
  enable_expert_vision: false
  enable_forward_prefetch: true
  # NOTE(review): enable_fp32 and enable_mixed_precision are both true; how
  # the two combine is not visible here -- confirm.
  enable_fp32: true
  enable_fsdp_offload: false
  enable_full_determinism: false
  # NOTE(review): false while data_parallel_mode is fsdp2 -- confirm this is
  # the intended sharding behaviour.
  enable_full_shard: false
  enable_gradient_checkpointing: true
  enable_mixed_precision: true
  # Profiling is off; the profile_* keys further down are presumably ignored
  # while this is false -- confirm.
  enable_profiling: false
  enable_reentrant: false
  enable_resume: true
  expert_parallel_size: 1
  # Both unset, consistent with enable_expert_vision: false above.
  expert_vision_path: null
  expert_vision_type: null
  freeze_vision_encoder: false
  freeze_vit: false
  # 256 = data_parallel_shard_size (8) * micro_batch_size (32); presumably
  # this means no gradient accumulation -- confirm.
  global_batch_size: 256
  init_device: cuda
  load_checkpoint_path: null
  # NOTE(review): "fm" presumably stands for flow matching -- confirm.
  loss_type: L1_fm
  # Base learning rate; vit_lr below is 100x smaller (1.0e-06).
  lr: 0.0001
  lr_decay_ratio: 1.0
  # With a constant style and lr_warmup_ratio: 0, lr_min and lr_start are
  # presumably unused -- confirm.
  lr_decay_style: constant
  lr_min: 1.0e-07
  lr_start: 0.0
  lr_warmup_ratio: 0
  max_action_dim: 75
  max_grad_norm: 1.0
  max_state_dim: 75
  # NOTE(review): max_steps and num_train_epochs (69) are both set; which
  # limit ends training first is not visible here.
  max_steps: 220000
  micro_batch_size: 32
  module_fsdp_enable: true
  norm_qkv: false
  num_steps: 10
  # 69 = 3 * save_epochs (23).
  num_train_epochs: 69
  optimizer: adamw
  pipeline_parallel_size: 1
  profile_end_step: 2
  profile_profile_memory: true
  profile_record_shapes: true
  profile_start_step: 1
  profile_trace_dir: ./trace
  profile_with_stack: true
  # Two-element list, both entries 224 (same as data.img_size); the order of
  # the two dimensions is not visible here.
  resize_imgs_with_padding:
  - 224
  - 224
  resume_dataloader_state: true
  rmpad: false
  rmpad_with_pos_ids: false
  # NOTE(review): save_epochs and save_steps are both set; whether both
  # triggers are active at once is not visible here.
  save_epochs: 23
  save_hf_weights: true
  save_steps: 10000
  seed: 42
  stable_train_steps: 100000
  tensor_parallel_size: 1
  # Much smaller than data.max_seq_len (2048); presumably limits only the
  # text prompt -- confirm.
  tokenizer_max_length: 72
  train_expert_only: false
  train_state_proj: true
  ulysses_parallel_size: 1
  # NOTE(review): true alongside enable_gradient_checkpointing: true. In
  # Hugging Face Transformers a KV cache and gradient checkpointing normally
  # conflict during training -- confirm what this flag controls here.
  use_cache: true
  use_compile: true
  use_delta_joint_actions_aloha: false
  # Weights & Biases logging is off; wandb_name is unset and wandb_project is
  # presumably only read when this is true -- confirm.
  use_wandb: false
  vit_lr: 1.0e-06
  vlm_causal: false
  wandb_name: null
  wandb_project: LingBotVLA
  weight_decay: 0