| experiment_name: modal_smoke | |
| trait: sports | |
| models: | |
| seed1: EleutherAI/pythia-70m | |
| dtype: bf16 | |
| device: cuda | |
| trust_remote_code: false | |
| training: | |
| method: sft | |
| max_seq_len: 96 | |
| learning_rate: 5.0e-06 | |
| batch_size: 1 | |
| gradient_accumulation_steps: 1 | |
| num_train_epochs: 1 | |
| max_steps: 2 | |
| warmup_steps: 0 | |
| weight_decay: 0.0 | |
| save_steps: 1000000 | |
| logging_steps: 1 | |
| bf16: true | |