| { |
| "best_metric": 0.77145, |
| "best_model_checkpoint": "text_gen/unlearn/checkpoint/t5-large/bad_teaching/2.0/samsum_42/checkpoint-18", |
| "epoch": 5.0, |
| "eval_steps": 500, |
| "global_step": 90, |
| "is_hyper_param_search": false, |
| "is_local_process_zero": true, |
| "is_world_process_zero": true, |
| "log_history": [ |
| { |
| "df_rougeL": 2.5684, |
| "epoch": 1.0, |
| "eval_gen_len": 117.5125, |
| "eval_loss": 5.078139781951904, |
| "eval_rouge1": 3.4658, |
| "eval_rouge2": 1.3784, |
| "eval_rougeL": 3.1345, |
| "eval_rougeLsum": 3.2705, |
| "eval_runtime": 1496.5741, |
| "eval_samples_per_second": 0.547, |
| "eval_steps_per_second": 0.017, |
| "eval_unlearn_overall_rougeL": 0.77145, |
| "step": 18, |
| "test_rougeL": 3.1113, |
| "unlearn_overall_rougeL": 0.77145, |
| "unlearn_time": -1 |
| }, |
| { |
| "df_rougeL": 16.3877, |
| "epoch": 2.0, |
| "eval_gen_len": 9.90375, |
| "eval_loss": 2.7741811275482178, |
| "eval_rouge1": 18.0247, |
| "eval_rouge2": 8.3532, |
| "eval_rougeL": 16.3652, |
| "eval_rougeLsum": 17.022, |
| "eval_runtime": 263.4378, |
| "eval_samples_per_second": 3.105, |
| "eval_steps_per_second": 0.099, |
| "eval_unlearn_overall_rougeL": 0.4784500000000005, |
| "step": 36, |
| "test_rougeL": 16.3446, |
| "unlearn_overall_rougeL": 0.4784500000000005, |
| "unlearn_time": -1 |
| }, |
| { |
| "df_rougeL": 0.037, |
| "epoch": 3.0, |
| "eval_gen_len": 120.74375, |
| "eval_loss": 32.48212432861328, |
| "eval_rouge1": 0.1096, |
| "eval_rouge2": 0.0147, |
| "eval_rougeL": 0.1078, |
| "eval_rougeLsum": 0.1103, |
| "eval_runtime": 1499.9815, |
| "eval_samples_per_second": 0.545, |
| "eval_steps_per_second": 0.017, |
| "eval_unlearn_overall_rougeL": 0.5387, |
| "step": 54, |
| "test_rougeL": 0.1144, |
| "unlearn_overall_rougeL": 0.5387, |
| "unlearn_time": -1 |
| }, |
| { |
| "df_rougeL": 0.037, |
| "epoch": 4.0, |
| "eval_gen_len": 125.785, |
| "eval_loss": 38.382774353027344, |
| "eval_rouge1": 0.0702, |
| "eval_rouge2": 0.0179, |
| "eval_rougeL": 0.0691, |
| "eval_rougeLsum": 0.0696, |
| "eval_runtime": 1500.0591, |
| "eval_samples_per_second": 0.545, |
| "eval_steps_per_second": 0.017, |
| "eval_unlearn_overall_rougeL": 0.5177499999999999, |
| "step": 72, |
| "test_rougeL": 0.0725, |
| "unlearn_overall_rougeL": 0.5177499999999999, |
| "unlearn_time": -1 |
| }, |
| { |
| "df_rougeL": 0.037, |
| "epoch": 5.0, |
| "eval_gen_len": 126.54, |
| "eval_loss": 39.759925842285156, |
| "eval_rouge1": 0.0426, |
| "eval_rouge2": 0.0, |
| "eval_rougeL": 0.0423, |
| "eval_rougeLsum": 0.0426, |
| "eval_runtime": 1500.0105, |
| "eval_samples_per_second": 0.545, |
| "eval_steps_per_second": 0.017, |
| "eval_unlearn_overall_rougeL": 0.50285, |
| "step": 90, |
| "test_rougeL": 0.0427, |
| "unlearn_overall_rougeL": 0.50285, |
| "unlearn_time": -1 |
| }, |
| { |
| "epoch": 5.0, |
| "step": 90, |
| "total_flos": 5937370337378304.0, |
| "train_loss": 0.0, |
| "train_runtime": 8983.6984, |
| "train_samples_per_second": 0.327, |
| "train_steps_per_second": 0.01 |
| } |
| ], |
| "logging_steps": 1000, |
| "max_steps": 90, |
| "num_input_tokens_seen": 0, |
| "num_train_epochs": 5, |
| "save_steps": 500, |
| "total_flos": 5937370337378304.0, |
| "train_batch_size": 32, |
| "trial_name": null, |
| "trial_params": null |
| } |
|
|