|
{ |
|
"best_metric": 1.0, |
|
"best_model_checkpoint": "delivery_truck_classification/checkpoint-4", |
|
"epoch": 59.94117647058823, |
|
"global_step": 240, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.94, |
|
"eval_accuracy": 1.0, |
|
"eval_loss": 0.028991766273975372, |
|
"eval_runtime": 3.7584, |
|
"eval_samples_per_second": 15.698, |
|
"eval_steps_per_second": 0.532, |
|
"step": 4 |
|
}, |
|
{ |
|
"epoch": 1.94, |
|
"eval_accuracy": 1.0, |
|
"eval_loss": 0.028991766273975372, |
|
"eval_runtime": 3.805, |
|
"eval_samples_per_second": 15.506, |
|
"eval_steps_per_second": 0.526, |
|
"step": 8 |
|
}, |
|
{ |
|
"epoch": 2.94, |
|
"eval_accuracy": 1.0, |
|
"eval_loss": 0.028991766273975372, |
|
"eval_runtime": 3.7489, |
|
"eval_samples_per_second": 15.738, |
|
"eval_steps_per_second": 0.533, |
|
"step": 12 |
|
}, |
|
{ |
|
"epoch": 3.94, |
|
"eval_accuracy": 1.0, |
|
"eval_loss": 0.028991766273975372, |
|
"eval_runtime": 3.8228, |
|
"eval_samples_per_second": 15.434, |
|
"eval_steps_per_second": 0.523, |
|
"step": 16 |
|
}, |
|
{ |
|
"epoch": 4.94, |
|
"learning_rate": 0.0, |
|
"loss": 0.2595, |
|
"step": 20 |
|
}, |
|
{ |
|
"epoch": 4.94, |
|
"eval_accuracy": 1.0, |
|
"eval_loss": 0.028991766273975372, |
|
"eval_runtime": 3.7534, |
|
"eval_samples_per_second": 15.719, |
|
"eval_steps_per_second": 0.533, |
|
"step": 20 |
|
}, |
|
{ |
|
"epoch": 5.94, |
|
"eval_accuracy": 1.0, |
|
"eval_loss": 0.028991766273975372, |
|
"eval_runtime": 3.7496, |
|
"eval_samples_per_second": 15.735, |
|
"eval_steps_per_second": 0.533, |
|
"step": 24 |
|
}, |
|
{ |
|
"epoch": 6.94, |
|
"eval_accuracy": 1.0, |
|
"eval_loss": 0.028991766273975372, |
|
"eval_runtime": 3.798, |
|
"eval_samples_per_second": 15.534, |
|
"eval_steps_per_second": 0.527, |
|
"step": 28 |
|
}, |
|
{ |
|
"epoch": 7.94, |
|
"eval_accuracy": 1.0, |
|
"eval_loss": 0.028991766273975372, |
|
"eval_runtime": 3.7322, |
|
"eval_samples_per_second": 15.808, |
|
"eval_steps_per_second": 0.536, |
|
"step": 32 |
|
}, |
|
{ |
|
"epoch": 8.94, |
|
"eval_accuracy": 1.0, |
|
"eval_loss": 0.028991766273975372, |
|
"eval_runtime": 3.7416, |
|
"eval_samples_per_second": 15.769, |
|
"eval_steps_per_second": 0.535, |
|
"step": 36 |
|
}, |
|
{ |
|
"epoch": 9.94, |
|
"learning_rate": 0.0, |
|
"loss": 0.2679, |
|
"step": 40 |
|
}, |
|
{ |
|
"epoch": 9.94, |
|
"eval_accuracy": 1.0, |
|
"eval_loss": 0.028991766273975372, |
|
"eval_runtime": 3.7284, |
|
"eval_samples_per_second": 15.824, |
|
"eval_steps_per_second": 0.536, |
|
"step": 40 |
|
}, |
|
{ |
|
"epoch": 10.94, |
|
"eval_accuracy": 1.0, |
|
"eval_loss": 0.028991766273975372, |
|
"eval_runtime": 3.726, |
|
"eval_samples_per_second": 15.835, |
|
"eval_steps_per_second": 0.537, |
|
"step": 44 |
|
}, |
|
{ |
|
"epoch": 11.94, |
|
"eval_accuracy": 1.0, |
|
"eval_loss": 0.028991766273975372, |
|
"eval_runtime": 3.7864, |
|
"eval_samples_per_second": 15.582, |
|
"eval_steps_per_second": 0.528, |
|
"step": 48 |
|
}, |
|
{ |
|
"epoch": 12.94, |
|
"eval_accuracy": 1.0, |
|
"eval_loss": 0.028991766273975372, |
|
"eval_runtime": 3.8076, |
|
"eval_samples_per_second": 15.495, |
|
"eval_steps_per_second": 0.525, |
|
"step": 52 |
|
}, |
|
{ |
|
"epoch": 13.94, |
|
"eval_accuracy": 1.0, |
|
"eval_loss": 0.028991766273975372, |
|
"eval_runtime": 3.7937, |
|
"eval_samples_per_second": 15.552, |
|
"eval_steps_per_second": 0.527, |
|
"step": 56 |
|
}, |
|
{ |
|
"epoch": 14.94, |
|
"learning_rate": 0.0, |
|
"loss": 0.275, |
|
"step": 60 |
|
}, |
|
{ |
|
"epoch": 14.94, |
|
"eval_accuracy": 1.0, |
|
"eval_loss": 0.028991766273975372, |
|
"eval_runtime": 3.7461, |
|
"eval_samples_per_second": 15.75, |
|
"eval_steps_per_second": 0.534, |
|
"step": 60 |
|
}, |
|
{ |
|
"epoch": 15.94, |
|
"eval_accuracy": 1.0, |
|
"eval_loss": 0.028991766273975372, |
|
"eval_runtime": 3.8277, |
|
"eval_samples_per_second": 15.414, |
|
"eval_steps_per_second": 0.523, |
|
"step": 64 |
|
}, |
|
{ |
|
"epoch": 16.94, |
|
"eval_accuracy": 1.0, |
|
"eval_loss": 0.028991766273975372, |
|
"eval_runtime": 3.764, |
|
"eval_samples_per_second": 15.675, |
|
"eval_steps_per_second": 0.531, |
|
"step": 68 |
|
}, |
|
{ |
|
"epoch": 17.94, |
|
"eval_accuracy": 1.0, |
|
"eval_loss": 0.028991766273975372, |
|
"eval_runtime": 3.7719, |
|
"eval_samples_per_second": 15.642, |
|
"eval_steps_per_second": 0.53, |
|
"step": 72 |
|
}, |
|
{ |
|
"epoch": 18.94, |
|
"eval_accuracy": 1.0, |
|
"eval_loss": 0.028991766273975372, |
|
"eval_runtime": 3.826, |
|
"eval_samples_per_second": 15.421, |
|
"eval_steps_per_second": 0.523, |
|
"step": 76 |
|
}, |
|
{ |
|
"epoch": 19.94, |
|
"learning_rate": 0.0, |
|
"loss": 0.248, |
|
"step": 80 |
|
}, |
|
{ |
|
"epoch": 19.94, |
|
"eval_accuracy": 1.0, |
|
"eval_loss": 0.028991766273975372, |
|
"eval_runtime": 3.7289, |
|
"eval_samples_per_second": 15.822, |
|
"eval_steps_per_second": 0.536, |
|
"step": 80 |
|
}, |
|
{ |
|
"epoch": 20.94, |
|
"eval_accuracy": 1.0, |
|
"eval_loss": 0.028991766273975372, |
|
"eval_runtime": 3.7427, |
|
"eval_samples_per_second": 15.764, |
|
"eval_steps_per_second": 0.534, |
|
"step": 84 |
|
}, |
|
{ |
|
"epoch": 21.94, |
|
"eval_accuracy": 1.0, |
|
"eval_loss": 0.028991766273975372, |
|
"eval_runtime": 3.6831, |
|
"eval_samples_per_second": 16.019, |
|
"eval_steps_per_second": 0.543, |
|
"step": 88 |
|
}, |
|
{ |
|
"epoch": 22.94, |
|
"eval_accuracy": 1.0, |
|
"eval_loss": 0.028991766273975372, |
|
"eval_runtime": 3.764, |
|
"eval_samples_per_second": 15.675, |
|
"eval_steps_per_second": 0.531, |
|
"step": 92 |
|
}, |
|
{ |
|
"epoch": 23.94, |
|
"eval_accuracy": 1.0, |
|
"eval_loss": 0.028991766273975372, |
|
"eval_runtime": 3.7309, |
|
"eval_samples_per_second": 15.814, |
|
"eval_steps_per_second": 0.536, |
|
"step": 96 |
|
}, |
|
{ |
|
"epoch": 24.94, |
|
"learning_rate": 0.0, |
|
"loss": 0.2669, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 24.94, |
|
"eval_accuracy": 1.0, |
|
"eval_loss": 0.028991766273975372, |
|
"eval_runtime": 3.7661, |
|
"eval_samples_per_second": 15.666, |
|
"eval_steps_per_second": 0.531, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 25.94, |
|
"eval_accuracy": 1.0, |
|
"eval_loss": 0.028991766273975372, |
|
"eval_runtime": 3.682, |
|
"eval_samples_per_second": 16.024, |
|
"eval_steps_per_second": 0.543, |
|
"step": 104 |
|
}, |
|
{ |
|
"epoch": 26.94, |
|
"eval_accuracy": 1.0, |
|
"eval_loss": 0.028991766273975372, |
|
"eval_runtime": 3.7339, |
|
"eval_samples_per_second": 15.801, |
|
"eval_steps_per_second": 0.536, |
|
"step": 108 |
|
}, |
|
{ |
|
"epoch": 27.94, |
|
"eval_accuracy": 1.0, |
|
"eval_loss": 0.028991766273975372, |
|
"eval_runtime": 3.8015, |
|
"eval_samples_per_second": 15.52, |
|
"eval_steps_per_second": 0.526, |
|
"step": 112 |
|
}, |
|
{ |
|
"epoch": 28.94, |
|
"eval_accuracy": 1.0, |
|
"eval_loss": 0.028991766273975372, |
|
"eval_runtime": 3.7232, |
|
"eval_samples_per_second": 15.846, |
|
"eval_steps_per_second": 0.537, |
|
"step": 116 |
|
}, |
|
{ |
|
"epoch": 29.94, |
|
"learning_rate": 0.0, |
|
"loss": 0.2589, |
|
"step": 120 |
|
}, |
|
{ |
|
"epoch": 29.94, |
|
"eval_accuracy": 1.0, |
|
"eval_loss": 0.028991766273975372, |
|
"eval_runtime": 3.7329, |
|
"eval_samples_per_second": 15.805, |
|
"eval_steps_per_second": 0.536, |
|
"step": 120 |
|
}, |
|
{ |
|
"epoch": 30.94, |
|
"eval_accuracy": 1.0, |
|
"eval_loss": 0.028991766273975372, |
|
"eval_runtime": 3.7815, |
|
"eval_samples_per_second": 15.602, |
|
"eval_steps_per_second": 0.529, |
|
"step": 124 |
|
}, |
|
{ |
|
"epoch": 31.94, |
|
"eval_accuracy": 1.0, |
|
"eval_loss": 0.028991766273975372, |
|
"eval_runtime": 3.7496, |
|
"eval_samples_per_second": 15.735, |
|
"eval_steps_per_second": 0.533, |
|
"step": 128 |
|
}, |
|
{ |
|
"epoch": 32.94, |
|
"eval_accuracy": 1.0, |
|
"eval_loss": 0.028991766273975372, |
|
"eval_runtime": 3.7126, |
|
"eval_samples_per_second": 15.892, |
|
"eval_steps_per_second": 0.539, |
|
"step": 132 |
|
}, |
|
{ |
|
"epoch": 33.94, |
|
"eval_accuracy": 1.0, |
|
"eval_loss": 0.028991766273975372, |
|
"eval_runtime": 3.6855, |
|
"eval_samples_per_second": 16.009, |
|
"eval_steps_per_second": 0.543, |
|
"step": 136 |
|
}, |
|
{ |
|
"epoch": 34.94, |
|
"learning_rate": 0.0, |
|
"loss": 0.278, |
|
"step": 140 |
|
}, |
|
{ |
|
"epoch": 34.94, |
|
"eval_accuracy": 1.0, |
|
"eval_loss": 0.028991766273975372, |
|
"eval_runtime": 3.7784, |
|
"eval_samples_per_second": 15.615, |
|
"eval_steps_per_second": 0.529, |
|
"step": 140 |
|
}, |
|
{ |
|
"epoch": 35.94, |
|
"eval_accuracy": 1.0, |
|
"eval_loss": 0.028991766273975372, |
|
"eval_runtime": 3.7189, |
|
"eval_samples_per_second": 15.865, |
|
"eval_steps_per_second": 0.538, |
|
"step": 144 |
|
}, |
|
{ |
|
"epoch": 36.94, |
|
"eval_accuracy": 1.0, |
|
"eval_loss": 0.028991766273975372, |
|
"eval_runtime": 3.7865, |
|
"eval_samples_per_second": 15.582, |
|
"eval_steps_per_second": 0.528, |
|
"step": 148 |
|
}, |
|
{ |
|
"epoch": 37.94, |
|
"eval_accuracy": 1.0, |
|
"eval_loss": 0.028991766273975372, |
|
"eval_runtime": 3.7161, |
|
"eval_samples_per_second": 15.877, |
|
"eval_steps_per_second": 0.538, |
|
"step": 152 |
|
}, |
|
{ |
|
"epoch": 38.94, |
|
"eval_accuracy": 1.0, |
|
"eval_loss": 0.028991766273975372, |
|
"eval_runtime": 3.7413, |
|
"eval_samples_per_second": 15.77, |
|
"eval_steps_per_second": 0.535, |
|
"step": 156 |
|
}, |
|
{ |
|
"epoch": 39.94, |
|
"learning_rate": 0.0, |
|
"loss": 0.273, |
|
"step": 160 |
|
}, |
|
{ |
|
"epoch": 39.94, |
|
"eval_accuracy": 1.0, |
|
"eval_loss": 0.028991766273975372, |
|
"eval_runtime": 3.7504, |
|
"eval_samples_per_second": 15.732, |
|
"eval_steps_per_second": 0.533, |
|
"step": 160 |
|
}, |
|
{ |
|
"epoch": 40.94, |
|
"eval_accuracy": 1.0, |
|
"eval_loss": 0.028991766273975372, |
|
"eval_runtime": 3.7301, |
|
"eval_samples_per_second": 15.817, |
|
"eval_steps_per_second": 0.536, |
|
"step": 164 |
|
}, |
|
{ |
|
"epoch": 41.94, |
|
"eval_accuracy": 1.0, |
|
"eval_loss": 0.028991766273975372, |
|
"eval_runtime": 3.6896, |
|
"eval_samples_per_second": 15.991, |
|
"eval_steps_per_second": 0.542, |
|
"step": 168 |
|
}, |
|
{ |
|
"epoch": 42.94, |
|
"eval_accuracy": 1.0, |
|
"eval_loss": 0.028991766273975372, |
|
"eval_runtime": 3.8409, |
|
"eval_samples_per_second": 15.361, |
|
"eval_steps_per_second": 0.521, |
|
"step": 172 |
|
}, |
|
{ |
|
"epoch": 43.94, |
|
"eval_accuracy": 1.0, |
|
"eval_loss": 0.028991766273975372, |
|
"eval_runtime": 3.7381, |
|
"eval_samples_per_second": 15.783, |
|
"eval_steps_per_second": 0.535, |
|
"step": 176 |
|
}, |
|
{ |
|
"epoch": 44.94, |
|
"learning_rate": 0.0, |
|
"loss": 0.2535, |
|
"step": 180 |
|
}, |
|
{ |
|
"epoch": 44.94, |
|
"eval_accuracy": 1.0, |
|
"eval_loss": 0.028991766273975372, |
|
"eval_runtime": 3.7521, |
|
"eval_samples_per_second": 15.724, |
|
"eval_steps_per_second": 0.533, |
|
"step": 180 |
|
}, |
|
{ |
|
"epoch": 45.94, |
|
"eval_accuracy": 1.0, |
|
"eval_loss": 0.028991766273975372, |
|
"eval_runtime": 3.7759, |
|
"eval_samples_per_second": 15.625, |
|
"eval_steps_per_second": 0.53, |
|
"step": 184 |
|
}, |
|
{ |
|
"epoch": 46.94, |
|
"eval_accuracy": 1.0, |
|
"eval_loss": 0.028991766273975372, |
|
"eval_runtime": 3.7894, |
|
"eval_samples_per_second": 15.57, |
|
"eval_steps_per_second": 0.528, |
|
"step": 188 |
|
}, |
|
{ |
|
"epoch": 47.94, |
|
"eval_accuracy": 1.0, |
|
"eval_loss": 0.028991766273975372, |
|
"eval_runtime": 3.7432, |
|
"eval_samples_per_second": 15.762, |
|
"eval_steps_per_second": 0.534, |
|
"step": 192 |
|
}, |
|
{ |
|
"epoch": 48.94, |
|
"eval_accuracy": 1.0, |
|
"eval_loss": 0.028991766273975372, |
|
"eval_runtime": 3.7921, |
|
"eval_samples_per_second": 15.559, |
|
"eval_steps_per_second": 0.527, |
|
"step": 196 |
|
}, |
|
{ |
|
"epoch": 49.94, |
|
"learning_rate": 0.0, |
|
"loss": 0.2762, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 49.94, |
|
"eval_accuracy": 1.0, |
|
"eval_loss": 0.028991766273975372, |
|
"eval_runtime": 3.8149, |
|
"eval_samples_per_second": 15.466, |
|
"eval_steps_per_second": 0.524, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 50.94, |
|
"eval_accuracy": 1.0, |
|
"eval_loss": 0.028991766273975372, |
|
"eval_runtime": 3.7494, |
|
"eval_samples_per_second": 15.736, |
|
"eval_steps_per_second": 0.533, |
|
"step": 204 |
|
}, |
|
{ |
|
"epoch": 51.94, |
|
"eval_accuracy": 1.0, |
|
"eval_loss": 0.028991766273975372, |
|
"eval_runtime": 3.758, |
|
"eval_samples_per_second": 15.7, |
|
"eval_steps_per_second": 0.532, |
|
"step": 208 |
|
}, |
|
{ |
|
"epoch": 52.94, |
|
"eval_accuracy": 1.0, |
|
"eval_loss": 0.028991766273975372, |
|
"eval_runtime": 4.5125, |
|
"eval_samples_per_second": 13.075, |
|
"eval_steps_per_second": 0.443, |
|
"step": 212 |
|
}, |
|
{ |
|
"epoch": 53.94, |
|
"eval_accuracy": 1.0, |
|
"eval_loss": 0.028991766273975372, |
|
"eval_runtime": 3.6913, |
|
"eval_samples_per_second": 15.983, |
|
"eval_steps_per_second": 0.542, |
|
"step": 216 |
|
}, |
|
{ |
|
"epoch": 54.94, |
|
"learning_rate": 0.0, |
|
"loss": 0.2798, |
|
"step": 220 |
|
}, |
|
{ |
|
"epoch": 54.94, |
|
"eval_accuracy": 1.0, |
|
"eval_loss": 0.028991766273975372, |
|
"eval_runtime": 3.7635, |
|
"eval_samples_per_second": 15.677, |
|
"eval_steps_per_second": 0.531, |
|
"step": 220 |
|
}, |
|
{ |
|
"epoch": 55.94, |
|
"eval_accuracy": 1.0, |
|
"eval_loss": 0.028991766273975372, |
|
"eval_runtime": 3.7464, |
|
"eval_samples_per_second": 15.748, |
|
"eval_steps_per_second": 0.534, |
|
"step": 224 |
|
}, |
|
{ |
|
"epoch": 56.94, |
|
"eval_accuracy": 1.0, |
|
"eval_loss": 0.028991766273975372, |
|
"eval_runtime": 3.7621, |
|
"eval_samples_per_second": 15.683, |
|
"eval_steps_per_second": 0.532, |
|
"step": 228 |
|
}, |
|
{ |
|
"epoch": 57.94, |
|
"eval_accuracy": 1.0, |
|
"eval_loss": 0.028991766273975372, |
|
"eval_runtime": 3.7552, |
|
"eval_samples_per_second": 15.712, |
|
"eval_steps_per_second": 0.533, |
|
"step": 232 |
|
}, |
|
{ |
|
"epoch": 58.94, |
|
"eval_accuracy": 1.0, |
|
"eval_loss": 0.028991766273975372, |
|
"eval_runtime": 3.8189, |
|
"eval_samples_per_second": 15.449, |
|
"eval_steps_per_second": 0.524, |
|
"step": 236 |
|
}, |
|
{ |
|
"epoch": 59.94, |
|
"learning_rate": 0.0, |
|
"loss": 0.2709, |
|
"step": 240 |
|
}, |
|
{ |
|
"epoch": 59.94, |
|
"eval_accuracy": 1.0, |
|
"eval_loss": 0.028991766273975372, |
|
"eval_runtime": 3.7206, |
|
"eval_samples_per_second": 15.858, |
|
"eval_steps_per_second": 0.538, |
|
"step": 240 |
|
}, |
|
{ |
|
"epoch": 59.94, |
|
"step": 240, |
|
"total_flos": 7.88616702456404e+17, |
|
"train_loss": 0.267316605647405, |
|
"train_runtime": 6314.82, |
|
"train_samples_per_second": 5.026, |
|
"train_steps_per_second": 0.038 |
|
} |
|
], |
|
"max_steps": 240, |
|
"num_train_epochs": 60, |
|
"total_flos": 7.88616702456404e+17, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|