|
{ |
|
"best_metric": 0.8639652677279306, |
|
"best_model_checkpoint": "swin-base-patch4-window7-224-in22k-MM_Classification_base_V10/checkpoint-100", |
|
"epoch": 6.686567164179104, |
|
"eval_steps": 500, |
|
"global_step": 112, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.5970149253731343, |
|
"grad_norm": 3.4567720890045166, |
|
"learning_rate": 4.166666666666667e-05, |
|
"loss": 0.9254, |
|
"step": 10 |
|
}, |
|
{ |
|
"epoch": 0.9552238805970149, |
|
"eval_accuracy": 0.8133140376266281, |
|
"eval_loss": 0.4842127859592438, |
|
"eval_runtime": 115.4192, |
|
"eval_samples_per_second": 5.987, |
|
"eval_steps_per_second": 0.052, |
|
"step": 16 |
|
}, |
|
{ |
|
"epoch": 1.1940298507462686, |
|
"grad_norm": 2.1373002529144287, |
|
"learning_rate": 4.600000000000001e-05, |
|
"loss": 0.5607, |
|
"step": 20 |
|
}, |
|
{ |
|
"epoch": 1.7910447761194028, |
|
"grad_norm": 1.4010789394378662, |
|
"learning_rate": 4.1e-05, |
|
"loss": 0.4552, |
|
"step": 30 |
|
}, |
|
{ |
|
"epoch": 1.9701492537313432, |
|
"eval_accuracy": 0.849493487698987, |
|
"eval_loss": 0.3855249881744385, |
|
"eval_runtime": 118.0615, |
|
"eval_samples_per_second": 5.853, |
|
"eval_steps_per_second": 0.051, |
|
"step": 33 |
|
}, |
|
{ |
|
"epoch": 2.388059701492537, |
|
"grad_norm": 3.225425958633423, |
|
"learning_rate": 3.6e-05, |
|
"loss": 0.4006, |
|
"step": 40 |
|
}, |
|
{ |
|
"epoch": 2.9850746268656714, |
|
"grad_norm": 1.8630387783050537, |
|
"learning_rate": 3.1e-05, |
|
"loss": 0.4034, |
|
"step": 50 |
|
}, |
|
{ |
|
"epoch": 2.9850746268656714, |
|
"eval_accuracy": 0.8610709117221418, |
|
"eval_loss": 0.34522491693496704, |
|
"eval_runtime": 76.1197, |
|
"eval_samples_per_second": 9.078, |
|
"eval_steps_per_second": 0.079, |
|
"step": 50 |
|
}, |
|
{ |
|
"epoch": 3.582089552238806, |
|
"grad_norm": 2.277456521987915, |
|
"learning_rate": 2.6000000000000002e-05, |
|
"loss": 0.3583, |
|
"step": 60 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_accuracy": 0.8581765557163531, |
|
"eval_loss": 0.33568304777145386, |
|
"eval_runtime": 76.3565, |
|
"eval_samples_per_second": 9.05, |
|
"eval_steps_per_second": 0.079, |
|
"step": 67 |
|
}, |
|
{ |
|
"epoch": 4.17910447761194, |
|
"grad_norm": 1.8838659524917603, |
|
"learning_rate": 2.1e-05, |
|
"loss": 0.3683, |
|
"step": 70 |
|
}, |
|
{ |
|
"epoch": 4.776119402985074, |
|
"grad_norm": 2.815551996231079, |
|
"learning_rate": 1.6000000000000003e-05, |
|
"loss": 0.353, |
|
"step": 80 |
|
}, |
|
{ |
|
"epoch": 4.955223880597015, |
|
"eval_accuracy": 0.8625180897250362, |
|
"eval_loss": 0.32812753319740295, |
|
"eval_runtime": 76.4607, |
|
"eval_samples_per_second": 9.037, |
|
"eval_steps_per_second": 0.078, |
|
"step": 83 |
|
}, |
|
{ |
|
"epoch": 5.373134328358209, |
|
"grad_norm": 2.2589757442474365, |
|
"learning_rate": 1.1000000000000001e-05, |
|
"loss": 0.3218, |
|
"step": 90 |
|
}, |
|
{ |
|
"epoch": 5.970149253731344, |
|
"grad_norm": 2.3260316848754883, |
|
"learning_rate": 6e-06, |
|
"loss": 0.3387, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 5.970149253731344, |
|
"eval_accuracy": 0.8639652677279306, |
|
"eval_loss": 0.3239884674549103, |
|
"eval_runtime": 76.5373, |
|
"eval_samples_per_second": 9.028, |
|
"eval_steps_per_second": 0.078, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 6.567164179104478, |
|
"grad_norm": 2.35009765625, |
|
"learning_rate": 1.0000000000000002e-06, |
|
"loss": 0.3157, |
|
"step": 110 |
|
}, |
|
{ |
|
"epoch": 6.686567164179104, |
|
"eval_accuracy": 0.8639652677279306, |
|
"eval_loss": 0.325300008058548, |
|
"eval_runtime": 76.553, |
|
"eval_samples_per_second": 9.026, |
|
"eval_steps_per_second": 0.078, |
|
"step": 112 |
|
}, |
|
{ |
|
"epoch": 6.686567164179104, |
|
"step": 112, |
|
"total_flos": 4.4574447113624494e+18, |
|
"train_loss": 0.43422421866229605, |
|
"train_runtime": 7488.3728, |
|
"train_samples_per_second": 7.947, |
|
"train_steps_per_second": 0.015 |
|
} |
|
], |
|
"logging_steps": 10, |
|
"max_steps": 112, |
|
"num_input_tokens_seen": 0, |
|
"num_train_epochs": 7, |
|
"save_steps": 500, |
|
"stateful_callbacks": { |
|
"TrainerControl": { |
|
"args": { |
|
"should_epoch_stop": false, |
|
"should_evaluate": false, |
|
"should_log": false, |
|
"should_save": true, |
|
"should_training_stop": true |
|
}, |
|
"attributes": {} |
|
} |
|
}, |
|
"total_flos": 4.4574447113624494e+18, |
|
"train_batch_size": 128, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|