robbyant
/

lingbot-vla-4b-depth-posttrain-robotwin

Model card Files Files and versions

lingbot-vla-4b-depth-posttrain-robotwin / lingbotvla_cli.yaml

Weiww99's picture

Update lingbotvla_cli.yaml

aef7426 verified 9 days ago

history blame contribute delete

3.06 kB

	data:
	cameras:
	- camera_top
	- camera_wrist_left
	- camera_wrist_right
	chat_template: default
	data_name: robotwin
	data_type: conversation
	dataloader_type: native
	datasets_type: vla
	drop_last: true
	img_size: 224
	joints:
	- '{''arm.position'': 14}'
	- '{''effector.position'': 2}'
	max_seq_len: 2048
	norm_stats_file: assets/norm_stats/robotwin_50.json
	norm_type: bounds_99
	num_workers: 8
	pin_memory: true
	prefetch_factor: 4
	robot_config_root: configs/robot_configs
	text_keys: messages
	train_path: ./assets/training_data/robotwin_all_tasks_with_aug.txt
	train_size: 8000000
	model:
	adanorm_time: true
	attn_implementation: flash_attention_2
	basic_modules: []
	decoders: {}
	encoders: {}
	final_norm_adanorm: false
	force_use_huggingface: false
	moge_path: null
	morgbd_path: null
	nosplit_gate_liner: false
	post_training: true
	separate_time_proj: false
	split_gate_liner: false
	use_lm_head: false
	vlm_repo_id: null
	vocab_size: 0
	train:
	action_dim: null
	activation_gpu_limit: 0.0
	adapt_to_pi_aloha: false
	align_params: {}
	bsz_warmup_init_mbtoken: 200
	bsz_warmup_ratio: 0
	chunk_size: 50
	ckpt_manager: dcp
	context_parallel_size: 1
	data_parallel_mode: fsdp2
	data_parallel_replicate_size: 1
	data_parallel_shard_size: 8
	decayed_max_grad_norm: 1.0
	dyn_bsz: true
	dyn_bsz_buffer_size: 200
	dyn_bsz_margin: 0
	empty_cache_steps: 500
	enable_activation_offload: false
	enable_expert_vision: false
	enable_forward_prefetch: true
	enable_fp32: true
	enable_fsdp_offload: false
	enable_full_determinism: false
	enable_full_shard: false
	enable_gradient_checkpointing: true
	enable_mixed_precision: true
	enable_profiling: false
	enable_reentrant: false
	enable_resume: true
	expert_parallel_size: 1
	expert_vision_path: null
	expert_vision_type: null
	freeze_vision_encoder: false
	freeze_vit: false
	global_batch_size: 256
	init_device: cuda
	load_checkpoint_path: null
	loss_type: L1_fm
	lr: 0.0001
	lr_decay_ratio: 1.0
	lr_decay_style: constant
	lr_min: 1.0e-07
	lr_start: 0.0
	lr_warmup_ratio: 0
	max_action_dim: 75
	max_grad_norm: 1.0
	max_state_dim: 75
	max_steps: 220000
	micro_batch_size: 32
	module_fsdp_enable: true
	norm_qkv: false
	num_steps: 10
	num_train_epochs: 69
	optimizer: adamw
	pipeline_parallel_size: 1
	profile_end_step: 2
	profile_profile_memory: true
	profile_record_shapes: true
	profile_start_step: 1
	profile_trace_dir: ./trace
	profile_with_stack: true
	resize_imgs_with_padding:
	- 224
	- 224
	resume_dataloader_state: true
	rmpad: false
	rmpad_with_pos_ids: false
	save_epochs: 23
	save_hf_weights: true
	save_steps: 10000
	seed: 42
	stable_train_steps: 100000
	tensor_parallel_size: 1
	tokenizer_max_length: 72
	train_expert_only: false
	train_state_proj: true
	ulysses_parallel_size: 1
	use_cache: true
	use_compile: true
	use_delta_joint_actions_aloha: false
	use_wandb: false
	vit_lr: 1.0e-06
	vlm_causal: false
	wandb_name: null
	wandb_project: LingBotVLA
	weight_decay: 0