| { |
| "best_metric": 0.6603000000000001, |
| "best_model_checkpoint": "text_gen/unlearn/checkpoint/t5-large/neggrad/4.0/samsum_42/checkpoint-219", |
| "epoch": 5.0, |
| "eval_steps": 500, |
| "global_step": 365, |
| "is_hyper_param_search": false, |
| "is_local_process_zero": true, |
| "is_world_process_zero": true, |
| "log_history": [ |
| { |
| "df_rougeL": 35.3727, |
| "epoch": 1.0, |
| "eval_gen_len": 19.8515625, |
| "eval_loss": 1.6698297262191772, |
| "eval_rouge1": 42.7849, |
| "eval_rouge2": 20.7407, |
| "eval_rougeL": 35.446, |
| "eval_rougeLsum": 39.589, |
| "eval_runtime": 349.4427, |
| "eval_samples_per_second": 2.341, |
| "eval_steps_per_second": 0.037, |
| "eval_unlearn_overall_rougeL": 0.5366499999999981, |
| "step": 73, |
| "test_rougeL": 35.446, |
| "unlearn_overall_rougeL": 0.5366499999999981, |
| "unlearn_time": -1 |
| }, |
| { |
| "df_rougeL": 12.4648, |
| "epoch": 2.0, |
| "eval_gen_len": 9.197916666666666, |
| "eval_loss": 7.590928554534912, |
| "eval_rouge1": 13.9304, |
| "eval_rouge2": 3.6865, |
| "eval_rougeL": 12.3627, |
| "eval_rougeLsum": 13.2181, |
| "eval_runtime": 638.2368, |
| "eval_samples_per_second": 1.282, |
| "eval_steps_per_second": 0.02, |
| "eval_unlearn_overall_rougeL": 0.44894999999999996, |
| "step": 146, |
| "test_rougeL": 12.3627, |
| "unlearn_overall_rougeL": 0.44894999999999996, |
| "unlearn_time": -1 |
| }, |
| { |
| "df_rougeL": 2.9036, |
| "epoch": 3.0, |
| "eval_gen_len": 2.96484375, |
| "eval_loss": 87.1946029663086, |
| "eval_rouge1": 3.236, |
| "eval_rouge2": 0.0575, |
| "eval_rougeL": 3.2242, |
| "eval_rougeLsum": 3.229, |
| "eval_runtime": 65.884, |
| "eval_samples_per_second": 12.416, |
| "eval_steps_per_second": 0.197, |
| "eval_unlearn_overall_rougeL": 0.6603000000000001, |
| "step": 219, |
| "test_rougeL": 3.2242, |
| "unlearn_overall_rougeL": 0.6603000000000001, |
| "unlearn_time": -1 |
| }, |
| { |
| "df_rougeL": 0.9739, |
| "epoch": 4.0, |
| "eval_gen_len": 2.12109375, |
| "eval_loss": 144.74517822265625, |
| "eval_rouge1": 0.8156, |
| "eval_rouge2": 0.0074, |
| "eval_rougeL": 0.8256, |
| "eval_rougeLsum": 0.8157, |
| "eval_runtime": 58.5107, |
| "eval_samples_per_second": 13.98, |
| "eval_steps_per_second": 0.222, |
| "eval_unlearn_overall_rougeL": 0.42585, |
| "step": 292, |
| "test_rougeL": 0.8256, |
| "unlearn_overall_rougeL": 0.42585, |
| "unlearn_time": -1 |
| }, |
| { |
| "df_rougeL": 0.6594, |
| "epoch": 5.0, |
| "eval_gen_len": 2.0377604166666665, |
| "eval_loss": 160.100341796875, |
| "eval_rouge1": 0.6105, |
| "eval_rouge2": 0.0, |
| "eval_rougeL": 0.6166, |
| "eval_rougeLsum": 0.6071, |
| "eval_runtime": 57.912, |
| "eval_samples_per_second": 14.125, |
| "eval_steps_per_second": 0.224, |
| "eval_unlearn_overall_rougeL": 0.4786, |
| "step": 365, |
| "test_rougeL": 0.6166, |
| "unlearn_overall_rougeL": 0.4786, |
| "unlearn_time": -1 |
| }, |
| { |
| "epoch": 5.0, |
| "step": 365, |
| "total_flos": 4443124453244928.0, |
| "train_loss": -37.45592626284247, |
| "train_runtime": 2431.0267, |
| "train_samples_per_second": 1.211, |
| "train_steps_per_second": 0.15 |
| } |
| ], |
| "logging_steps": 1000, |
| "max_steps": 365, |
| "num_input_tokens_seen": 0, |
| "num_train_epochs": 5, |
| "save_steps": 500, |
| "total_flos": 4443124453244928.0, |
| "train_batch_size": 8, |
| "trial_name": null, |
| "trial_params": null |
| } |
|
|