{ "best_metric": 73.16917224867254, "best_model_checkpoint": "/home/jcanete/ft-data/all_results/sqac/albeto_base_6/epochs_4_bs_16_lr_5e-5/checkpoint-1800", "epoch": 4.0, "global_step": 4152, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.19, "eval_exact_match": 33.36909871244635, "eval_f1": 54.78264317515576, "step": 200 }, { "epoch": 0.39, "eval_exact_match": 43.50858369098712, "eval_f1": 63.86348098660957, "step": 400 }, { "epoch": 0.48, "learning_rate": 4.4014932562620424e-05, "loss": 2.2717, "step": 500 }, { "epoch": 0.58, "eval_exact_match": 48.22961373390558, "eval_f1": 67.33109541594044, "step": 600 }, { "epoch": 0.77, "eval_exact_match": 51.3412017167382, "eval_f1": 70.04063336916818, "step": 800 }, { "epoch": 0.96, "learning_rate": 3.799373795761079e-05, "loss": 1.3831, "step": 1000 }, { "epoch": 0.96, "eval_exact_match": 51.44849785407725, "eval_f1": 70.96531020638378, "step": 1000 }, { "epoch": 1.16, "eval_exact_match": 52.73605150214592, "eval_f1": 71.04868788055973, "step": 1200 }, { "epoch": 1.35, "eval_exact_match": 52.78969957081545, "eval_f1": 71.7028117298826, "step": 1400 }, { "epoch": 1.45, "learning_rate": 3.197254335260116e-05, "loss": 0.848, "step": 1500 }, { "epoch": 1.54, "eval_exact_match": 53.80901287553648, "eval_f1": 72.80035261141751, "step": 1600 }, { "epoch": 1.73, "eval_exact_match": 54.72103004291846, "eval_f1": 73.16917224867254, "step": 1800 }, { "epoch": 1.93, "learning_rate": 2.5951348747591525e-05, "loss": 0.7974, "step": 2000 }, { "epoch": 1.93, "eval_exact_match": 55.36480686695279, "eval_f1": 72.84567287023638, "step": 2000 }, { "epoch": 2.12, "eval_exact_match": 53.80901287553648, "eval_f1": 71.49884589693431, "step": 2200 }, { "epoch": 2.31, "eval_exact_match": 53.862660944206006, "eval_f1": 72.42435834140822, "step": 2400 }, { "epoch": 2.41, "learning_rate": 1.9930154142581888e-05, "loss": 0.4397, "step": 2500 }, { "epoch": 2.5, "eval_exact_match": 53.91630901287554, "eval_f1": 72.01940673830065, "step": 2600 }, { "epoch": 2.7, "eval_exact_match": 54.18454935622318, "eval_f1": 72.42131954627004, "step": 2800 }, { "epoch": 2.89, "learning_rate": 1.3908959537572255e-05, "loss": 0.3679, "step": 3000 }, { "epoch": 2.89, "eval_exact_match": 53.648068669527895, "eval_f1": 72.24358443143393, "step": 3000 }, { "epoch": 3.08, "eval_exact_match": 53.16523605150215, "eval_f1": 71.85180232237707, "step": 3200 }, { "epoch": 3.28, "eval_exact_match": 53.701716738197426, "eval_f1": 71.87041699024132, "step": 3400 }, { "epoch": 3.37, "learning_rate": 7.88776493256262e-06, "loss": 0.1905, "step": 3500 }, { "epoch": 3.47, "eval_exact_match": 53.37982832618026, "eval_f1": 71.85913435306477, "step": 3600 }, { "epoch": 3.66, "eval_exact_match": 53.21888412017167, "eval_f1": 71.95656973845054, "step": 3800 }, { "epoch": 3.85, "learning_rate": 1.8665703275529866e-06, "loss": 0.1273, "step": 4000 }, { "epoch": 3.85, "eval_exact_match": 52.84334763948498, "eval_f1": 71.60301657985642, "step": 4000 }, { "epoch": 4.0, "step": 4152, "total_flos": 1433973109980672.0, "train_loss": 0.7790700769148811, "train_runtime": 432.1028, "train_samples_per_second": 153.649, "train_steps_per_second": 9.609 } ], "max_steps": 4152, "num_train_epochs": 4, "total_flos": 1433973109980672.0, "trial_name": null, "trial_params": null }