| { |
| "best_metric": 0.5588609576225281, |
| "best_model_checkpoint": "/content/drive/MyDrive/Colab Notebooks/models/t5-small-codesearchnet-multilang-python-java-javascript-go/checkpoint-3750", |
| "epoch": 10.0, |
| "global_step": 3750, |
| "is_hyper_param_search": false, |
| "is_local_process_zero": true, |
| "is_world_process_zero": true, |
| "log_history": [ |
| { |
| "epoch": 1.0, |
| "eval_avg_length": 16.436, |
| "eval_bleu": 0.0028, |
| "eval_loss": 0.7349299192428589, |
| "eval_rouge1": 0.1562, |
| "eval_rouge2": 0.0364, |
| "eval_runtime": 171.828, |
| "eval_samples_per_second": 29.099, |
| "eval_steps_per_second": 3.637, |
| "step": 375 |
| }, |
| { |
| "epoch": 1.33, |
| "learning_rate": 0.011613096110522747, |
| "loss": 2.3117, |
| "step": 500 |
| }, |
| { |
| "epoch": 2.0, |
| "eval_avg_length": 16.824, |
| "eval_bleu": 0.0066, |
| "eval_loss": 0.6613165736198425, |
| "eval_rouge1": 0.1818, |
| "eval_rouge2": 0.0531, |
| "eval_runtime": 169.3563, |
| "eval_samples_per_second": 29.524, |
| "eval_steps_per_second": 3.69, |
| "step": 750 |
| }, |
| { |
| "epoch": 2.67, |
| "learning_rate": 0.023271184414625168, |
| "loss": 0.6755, |
| "step": 1000 |
| }, |
| { |
| "epoch": 3.0, |
| "eval_avg_length": 16.931, |
| "eval_bleu": 0.007, |
| "eval_loss": 0.6232756972312927, |
| "eval_rouge1": 0.1957, |
| "eval_rouge2": 0.0594, |
| "eval_runtime": 169.3476, |
| "eval_samples_per_second": 29.525, |
| "eval_steps_per_second": 3.691, |
| "step": 1125 |
| }, |
| { |
| "epoch": 4.0, |
| "learning_rate": 0.03499825298786163, |
| "loss": 0.5998, |
| "step": 1500 |
| }, |
| { |
| "epoch": 4.0, |
| "eval_avg_length": 16.7154, |
| "eval_bleu": 0.0082, |
| "eval_loss": 0.6022565364837646, |
| "eval_rouge1": 0.202, |
| "eval_rouge2": 0.063, |
| "eval_runtime": 165.1906, |
| "eval_samples_per_second": 30.268, |
| "eval_steps_per_second": 3.784, |
| "step": 1500 |
| }, |
| { |
| "epoch": 5.0, |
| "eval_avg_length": 16.5468, |
| "eval_bleu": 0.0096, |
| "eval_loss": 0.5925326943397522, |
| "eval_rouge1": 0.2154, |
| "eval_rouge2": 0.0703, |
| "eval_runtime": 162.8367, |
| "eval_samples_per_second": 30.706, |
| "eval_steps_per_second": 3.838, |
| "step": 1875 |
| }, |
| { |
| "epoch": 5.33, |
| "learning_rate": 0.04682626947760582, |
| "loss": 0.5511, |
| "step": 2000 |
| }, |
| { |
| "epoch": 6.0, |
| "eval_avg_length": 15.7216, |
| "eval_bleu": 0.0091, |
| "eval_loss": 0.5728126168251038, |
| "eval_rouge1": 0.2213, |
| "eval_rouge2": 0.0774, |
| "eval_runtime": 160.1137, |
| "eval_samples_per_second": 31.228, |
| "eval_steps_per_second": 3.903, |
| "step": 2250 |
| }, |
| { |
| "epoch": 6.67, |
| "learning_rate": 0.05879075452685356, |
| "loss": 0.5147, |
| "step": 2500 |
| }, |
| { |
| "epoch": 7.0, |
| "eval_avg_length": 16.6658, |
| "eval_bleu": 0.0111, |
| "eval_loss": 0.5669918060302734, |
| "eval_rouge1": 0.2311, |
| "eval_rouge2": 0.0815, |
| "eval_runtime": 160.5038, |
| "eval_samples_per_second": 31.152, |
| "eval_steps_per_second": 3.894, |
| "step": 2625 |
| }, |
| { |
| "epoch": 8.0, |
| "learning_rate": 0.07094069570302963, |
| "loss": 0.4861, |
| "step": 3000 |
| }, |
| { |
| "epoch": 8.0, |
| "eval_avg_length": 17.038, |
| "eval_bleu": 0.0089, |
| "eval_loss": 0.5627844929695129, |
| "eval_rouge1": 0.2217, |
| "eval_rouge2": 0.077, |
| "eval_runtime": 160.3931, |
| "eval_samples_per_second": 31.173, |
| "eval_steps_per_second": 3.897, |
| "step": 3000 |
| }, |
| { |
| "epoch": 9.0, |
| "eval_avg_length": 16.362, |
| "eval_bleu": 0.0103, |
| "eval_loss": 0.5597769618034363, |
| "eval_rouge1": 0.2311, |
| "eval_rouge2": 0.0825, |
| "eval_runtime": 159.243, |
| "eval_samples_per_second": 31.399, |
| "eval_steps_per_second": 3.925, |
| "step": 3375 |
| }, |
| { |
| "epoch": 9.33, |
| "learning_rate": 0.08328617364168167, |
| "loss": 0.4526, |
| "step": 3500 |
| }, |
| { |
| "epoch": 10.0, |
| "eval_avg_length": 15.4298, |
| "eval_bleu": 0.0083, |
| "eval_loss": 0.5588609576225281, |
| "eval_rouge1": 0.232, |
| "eval_rouge2": 0.086, |
| "eval_runtime": 160.7722, |
| "eval_samples_per_second": 31.1, |
| "eval_steps_per_second": 3.887, |
| "step": 3750 |
| } |
| ], |
| "max_steps": 5625, |
| "num_train_epochs": 15, |
| "total_flos": 2.03012702208e+16, |
| "trial_name": null, |
| "trial_params": null |
| } |
|
|