jialicheng's picture
Upload folder using huggingface_hub
01375c6 verified
raw
history blame
3.48 kB
{
"best_metric": 0.6603000000000001,
"best_model_checkpoint": "text_gen/unlearn/checkpoint/t5-large/neggrad/4.0/samsum_42/checkpoint-219",
"epoch": 5.0,
"eval_steps": 500,
"global_step": 365,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"df_rougeL": 35.3727,
"epoch": 1.0,
"eval_gen_len": 19.8515625,
"eval_loss": 1.6698297262191772,
"eval_rouge1": 42.7849,
"eval_rouge2": 20.7407,
"eval_rougeL": 35.446,
"eval_rougeLsum": 39.589,
"eval_runtime": 349.4427,
"eval_samples_per_second": 2.341,
"eval_steps_per_second": 0.037,
"eval_unlearn_overall_rougeL": 0.5366499999999981,
"step": 73,
"test_rougeL": 35.446,
"unlearn_overall_rougeL": 0.5366499999999981,
"unlearn_time": -1
},
{
"df_rougeL": 12.4648,
"epoch": 2.0,
"eval_gen_len": 9.197916666666666,
"eval_loss": 7.590928554534912,
"eval_rouge1": 13.9304,
"eval_rouge2": 3.6865,
"eval_rougeL": 12.3627,
"eval_rougeLsum": 13.2181,
"eval_runtime": 638.2368,
"eval_samples_per_second": 1.282,
"eval_steps_per_second": 0.02,
"eval_unlearn_overall_rougeL": 0.44894999999999996,
"step": 146,
"test_rougeL": 12.3627,
"unlearn_overall_rougeL": 0.44894999999999996,
"unlearn_time": -1
},
{
"df_rougeL": 2.9036,
"epoch": 3.0,
"eval_gen_len": 2.96484375,
"eval_loss": 87.1946029663086,
"eval_rouge1": 3.236,
"eval_rouge2": 0.0575,
"eval_rougeL": 3.2242,
"eval_rougeLsum": 3.229,
"eval_runtime": 65.884,
"eval_samples_per_second": 12.416,
"eval_steps_per_second": 0.197,
"eval_unlearn_overall_rougeL": 0.6603000000000001,
"step": 219,
"test_rougeL": 3.2242,
"unlearn_overall_rougeL": 0.6603000000000001,
"unlearn_time": -1
},
{
"df_rougeL": 0.9739,
"epoch": 4.0,
"eval_gen_len": 2.12109375,
"eval_loss": 144.74517822265625,
"eval_rouge1": 0.8156,
"eval_rouge2": 0.0074,
"eval_rougeL": 0.8256,
"eval_rougeLsum": 0.8157,
"eval_runtime": 58.5107,
"eval_samples_per_second": 13.98,
"eval_steps_per_second": 0.222,
"eval_unlearn_overall_rougeL": 0.42585,
"step": 292,
"test_rougeL": 0.8256,
"unlearn_overall_rougeL": 0.42585,
"unlearn_time": -1
},
{
"df_rougeL": 0.6594,
"epoch": 5.0,
"eval_gen_len": 2.0377604166666665,
"eval_loss": 160.100341796875,
"eval_rouge1": 0.6105,
"eval_rouge2": 0.0,
"eval_rougeL": 0.6166,
"eval_rougeLsum": 0.6071,
"eval_runtime": 57.912,
"eval_samples_per_second": 14.125,
"eval_steps_per_second": 0.224,
"eval_unlearn_overall_rougeL": 0.4786,
"step": 365,
"test_rougeL": 0.6166,
"unlearn_overall_rougeL": 0.4786,
"unlearn_time": -1
},
{
"epoch": 5.0,
"step": 365,
"total_flos": 4443124453244928.0,
"train_loss": -37.45592626284247,
"train_runtime": 2431.0267,
"train_samples_per_second": 1.211,
"train_steps_per_second": 0.15
}
],
"logging_steps": 1000,
"max_steps": 365,
"num_input_tokens_seen": 0,
"num_train_epochs": 5,
"save_steps": 500,
"total_flos": 4443124453244928.0,
"train_batch_size": 8,
"trial_name": null,
"trial_params": null
}