| { | |
| "best_metric": 0.6654040404040403, | |
| "best_model_checkpoint": "twitter-roberta-base-WNUT/checkpoint-500", | |
| "epoch": 10.0, | |
| "global_step": 540, | |
| "is_hyper_param_search": false, | |
| "is_local_process_zero": true, | |
| "is_world_process_zero": true, | |
| "log_history": [ | |
| { | |
| "epoch": 0.46, | |
| "eval_accuracy": 0.9205491641772071, | |
| "eval_f1": 0.0, | |
| "eval_loss": 0.39121243357658386, | |
| "eval_precision": 0.0, | |
| "eval_recall": 0.0, | |
| "eval_runtime": 1.5425, | |
| "eval_samples_per_second": 654.138, | |
| "eval_steps_per_second": 0.648, | |
| "step": 25 | |
| }, | |
| { | |
| "epoch": 0.93, | |
| "eval_accuracy": 0.9209305281891565, | |
| "eval_f1": 0.004739336492890995, | |
| "eval_loss": 0.2846619784832001, | |
| "eval_precision": 0.25, | |
| "eval_recall": 0.0023923444976076554, | |
| "eval_runtime": 1.5304, | |
| "eval_samples_per_second": 659.288, | |
| "eval_steps_per_second": 0.653, | |
| "step": 50 | |
| }, | |
| { | |
| "epoch": 1.39, | |
| "eval_accuracy": 0.9426047162016145, | |
| "eval_f1": 0.4239766081871345, | |
| "eval_loss": 0.2449360191822052, | |
| "eval_precision": 0.5451127819548872, | |
| "eval_recall": 0.34688995215311, | |
| "eval_runtime": 1.487, | |
| "eval_samples_per_second": 678.556, | |
| "eval_steps_per_second": 0.673, | |
| "step": 75 | |
| }, | |
| { | |
| "epoch": 1.85, | |
| "eval_accuracy": 0.9491514650734125, | |
| "eval_f1": 0.5565455791638108, | |
| "eval_loss": 0.19464540481567383, | |
| "eval_precision": 0.651685393258427, | |
| "eval_recall": 0.48564593301435405, | |
| "eval_runtime": 1.5409, | |
| "eval_samples_per_second": 654.812, | |
| "eval_steps_per_second": 0.649, | |
| "step": 100 | |
| }, | |
| { | |
| "epoch": 2.31, | |
| "eval_accuracy": 0.9581135193542236, | |
| "eval_f1": 0.621870882740448, | |
| "eval_loss": 0.1851097047328949, | |
| "eval_precision": 0.6920821114369502, | |
| "eval_recall": 0.5645933014354066, | |
| "eval_runtime": 1.5283, | |
| "eval_samples_per_second": 660.202, | |
| "eval_steps_per_second": 0.654, | |
| "step": 125 | |
| }, | |
| { | |
| "epoch": 2.78, | |
| "eval_accuracy": 0.9594482933960465, | |
| "eval_f1": 0.6331399097356544, | |
| "eval_loss": 0.1671772003173828, | |
| "eval_precision": 0.6867132867132867, | |
| "eval_recall": 0.5873205741626795, | |
| "eval_runtime": 1.7364, | |
| "eval_samples_per_second": 581.088, | |
| "eval_steps_per_second": 0.576, | |
| "step": 150 | |
| }, | |
| { | |
| "epoch": 3.24, | |
| "eval_accuracy": 0.9615457954617682, | |
| "eval_f1": 0.6276527331189711, | |
| "eval_loss": 0.16754180192947388, | |
| "eval_precision": 0.6787204450625869, | |
| "eval_recall": 0.583732057416268, | |
| "eval_runtime": 1.522, | |
| "eval_samples_per_second": 662.938, | |
| "eval_steps_per_second": 0.657, | |
| "step": 175 | |
| }, | |
| { | |
| "epoch": 3.7, | |
| "eval_accuracy": 0.9637704188648064, | |
| "eval_f1": 0.65389369592089, | |
| "eval_loss": 0.16441918909549713, | |
| "eval_precision": 0.6764705882352942, | |
| "eval_recall": 0.6327751196172249, | |
| "eval_runtime": 1.5477, | |
| "eval_samples_per_second": 651.939, | |
| "eval_steps_per_second": 0.646, | |
| "step": 200 | |
| }, | |
| { | |
| "epoch": 4.17, | |
| "eval_accuracy": 0.9640246615394394, | |
| "eval_f1": 0.673697270471464, | |
| "eval_loss": 0.1672356277704239, | |
| "eval_precision": 0.6997422680412371, | |
| "eval_recall": 0.6495215311004785, | |
| "eval_runtime": 1.5668, | |
| "eval_samples_per_second": 643.973, | |
| "eval_steps_per_second": 0.638, | |
| "step": 225 | |
| }, | |
| { | |
| "epoch": 4.63, | |
| "eval_accuracy": 0.9648509502319964, | |
| "eval_f1": 0.6666666666666666, | |
| "eval_loss": 0.16518081724643707, | |
| "eval_precision": 0.6915167095115681, | |
| "eval_recall": 0.6435406698564593, | |
| "eval_runtime": 1.544, | |
| "eval_samples_per_second": 653.501, | |
| "eval_steps_per_second": 0.648, | |
| "step": 250 | |
| }, | |
| { | |
| "epoch": 5.09, | |
| "eval_accuracy": 0.9629441301722494, | |
| "eval_f1": 0.6520618556701031, | |
| "eval_loss": 0.18820269405841827, | |
| "eval_precision": 0.7067039106145251, | |
| "eval_recall": 0.6052631578947368, | |
| "eval_runtime": 1.5459, | |
| "eval_samples_per_second": 652.688, | |
| "eval_steps_per_second": 0.647, | |
| "step": 275 | |
| }, | |
| { | |
| "epoch": 5.56, | |
| "eval_accuracy": 0.9644695862200471, | |
| "eval_f1": 0.6717267552182163, | |
| "eval_loss": 0.17831429839134216, | |
| "eval_precision": 0.7127516778523489, | |
| "eval_recall": 0.6351674641148325, | |
| "eval_runtime": 1.5976, | |
| "eval_samples_per_second": 631.564, | |
| "eval_steps_per_second": 0.626, | |
| "step": 300 | |
| }, | |
| { | |
| "epoch": 6.02, | |
| "eval_accuracy": 0.9638975402021229, | |
| "eval_f1": 0.6564885496183207, | |
| "eval_loss": 0.18128034472465515, | |
| "eval_precision": 0.7010869565217391, | |
| "eval_recall": 0.6172248803827751, | |
| "eval_runtime": 1.5524, | |
| "eval_samples_per_second": 649.966, | |
| "eval_steps_per_second": 0.644, | |
| "step": 325 | |
| }, | |
| { | |
| "epoch": 6.48, | |
| "eval_accuracy": 0.96472382889468, | |
| "eval_f1": 0.677561282212445, | |
| "eval_loss": 0.18036700785160065, | |
| "eval_precision": 0.713907284768212, | |
| "eval_recall": 0.6447368421052632, | |
| "eval_runtime": 1.6249, | |
| "eval_samples_per_second": 620.943, | |
| "eval_steps_per_second": 0.615, | |
| "step": 350 | |
| }, | |
| { | |
| "epoch": 6.94, | |
| "eval_accuracy": 0.9640882222080976, | |
| "eval_f1": 0.6709346991037132, | |
| "eval_loss": 0.19022008776664734, | |
| "eval_precision": 0.721763085399449, | |
| "eval_recall": 0.6267942583732058, | |
| "eval_runtime": 1.8093, | |
| "eval_samples_per_second": 557.663, | |
| "eval_steps_per_second": 0.553, | |
| "step": 375 | |
| }, | |
| { | |
| "epoch": 7.41, | |
| "eval_accuracy": 0.9640882222080976, | |
| "eval_f1": 0.668777707409753, | |
| "eval_loss": 0.1882619857788086, | |
| "eval_precision": 0.7106325706594886, | |
| "eval_recall": 0.631578947368421, | |
| "eval_runtime": 1.62, | |
| "eval_samples_per_second": 622.858, | |
| "eval_steps_per_second": 0.617, | |
| "step": 400 | |
| }, | |
| { | |
| "epoch": 7.87, | |
| "eval_accuracy": 0.9642789042140724, | |
| "eval_f1": 0.6683480453972257, | |
| "eval_loss": 0.18618735671043396, | |
| "eval_precision": 0.7066666666666667, | |
| "eval_recall": 0.6339712918660287, | |
| "eval_runtime": 1.5944, | |
| "eval_samples_per_second": 632.853, | |
| "eval_steps_per_second": 0.627, | |
| "step": 425 | |
| }, | |
| { | |
| "epoch": 8.33, | |
| "eval_accuracy": 0.9638975402021229, | |
| "eval_f1": 0.6670870113493064, | |
| "eval_loss": 0.1881590634584427, | |
| "eval_precision": 0.7053333333333334, | |
| "eval_recall": 0.6327751196172249, | |
| "eval_runtime": 1.7003, | |
| "eval_samples_per_second": 593.415, | |
| "eval_steps_per_second": 0.588, | |
| "step": 450 | |
| }, | |
| { | |
| "epoch": 8.8, | |
| "eval_accuracy": 0.9638339795334647, | |
| "eval_f1": 0.6658243840808591, | |
| "eval_loss": 0.19190868735313416, | |
| "eval_precision": 0.7054886211512718, | |
| "eval_recall": 0.6303827751196173, | |
| "eval_runtime": 1.543, | |
| "eval_samples_per_second": 653.928, | |
| "eval_steps_per_second": 0.648, | |
| "step": 475 | |
| }, | |
| { | |
| "epoch": 9.26, | |
| "learning_rate": 1.4814814814814815e-06, | |
| "loss": 0.1175, | |
| "step": 500 | |
| }, | |
| { | |
| "epoch": 9.26, | |
| "eval_accuracy": 0.9639611008707811, | |
| "eval_f1": 0.6654040404040403, | |
| "eval_loss": 0.19381117820739746, | |
| "eval_precision": 0.7045454545454546, | |
| "eval_recall": 0.6303827751196173, | |
| "eval_runtime": 1.541, | |
| "eval_samples_per_second": 654.789, | |
| "eval_steps_per_second": 0.649, | |
| "step": 500 | |
| }, | |
| { | |
| "epoch": 9.72, | |
| "eval_accuracy": 0.9645967075573635, | |
| "eval_f1": 0.6704190118824266, | |
| "eval_loss": 0.18799594044685364, | |
| "eval_precision": 0.7024901703800787, | |
| "eval_recall": 0.6411483253588517, | |
| "eval_runtime": 1.6071, | |
| "eval_samples_per_second": 627.849, | |
| "eval_steps_per_second": 0.622, | |
| "step": 525 | |
| }, | |
| { | |
| "epoch": 10.0, | |
| "step": 540, | |
| "total_flos": 1009327449452316.0, | |
| "train_loss": 0.11085769158822519, | |
| "train_runtime": 157.5154, | |
| "train_samples_per_second": 215.471, | |
| "train_steps_per_second": 3.428 | |
| } | |
| ], | |
| "max_steps": 540, | |
| "num_train_epochs": 10, | |
| "total_flos": 1009327449452316.0, | |
| "trial_name": null, | |
| "trial_params": null | |
| } | |