---
# Experiment configuration: a very short SFT run (max_steps: 2) on a small
# model. Restored to block style; every key and value is unchanged.

experiment_name: modal_smoke
trait: sports

# NOTE(review): the flattened original did not preserve nesting. dtype,
# device and trust_remote_code are placed under `models` here because they
# appear between `seed1` and `training`; confirm against the config loader
# whether they belong at top level instead.
models:
  seed1: EleutherAI/pythia-70m
  dtype: bf16
  device: cuda
  trust_remote_code: false

training:
  method: sft
  max_seq_len: 96
  # Written with a decimal point and a signed exponent so that YAML 1.1
  # parsers (e.g. PyYAML) resolve it as a float rather than a string.
  learning_rate: 5.0e-06
  batch_size: 1
  gradient_accumulation_steps: 1
  num_train_epochs: 1
  max_steps: 2
  warmup_steps: 0
  weight_decay: 0.0
  # save_steps is far larger than max_steps (2); presumably this keeps the
  # run from writing intermediate checkpoints -- TODO confirm with trainer.
  save_steps: 1000000
  logging_steps: 1
  bf16: true