{
  "model_type": "vjepa2_ac",
  "architecture": {
    "encoder": {
      "model_name": "vit_large",
      "embed_dim": 1024,
      "num_patches": 196,
      "patch_size": 16,
      "img_size": 256,
      "weights": "vision_encoder.pt"
    },
    "predictor": {
      "action_dim": 6,
      "depth": 4,
      "heads": 8,
      "embed_dim": 384,
      "dropout": 0.1,
      "weights": "pytorch_model.bin"
    }
  },
  "data_config": {
    "camera": "observation.images.phone",
    "clip_len": 8,
    "frame_step": 2,
    "context_frames": 6,
    "target_frames": 2
  },
  "training_params": {
    "epochs": 300,
    "batch_size": 2,
    "lr": 0.0001,
    "weight_decay": 0.05,
    "warmup_epochs": 20
  },
  "dataset": "SO-100 Ball-Cup Robotics Dataset"
}