{
"all_params": 3760275456,
"memory_footprint": 7531865424,
"total_flos": 4.419854408240333e+16,
"train_loss": 0.537436925212387,
"train_runtime": 3691.1633,
"train_samples_per_second": 0.863,
"train_steps_per_second": 0.107,
"trainable_params": 5652480,
"trainable_params_percent": 0.15032090244827
}