File size: 9,796 Bytes
d59c8e2
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
{"current_steps": 5, "total_steps": 222, "loss": 1.7484, "learning_rate": 5e-07, "epoch": 0.06756756756756757, "percentage": 2.25, "elapsed_time": "0:01:08", "remaining_time": "0:49:43"}
{"current_steps": 10, "total_steps": 222, "loss": 1.6, "learning_rate": 1e-06, "epoch": 0.13513513513513514, "percentage": 4.5, "elapsed_time": "0:02:14", "remaining_time": "0:47:35"}
{"current_steps": 15, "total_steps": 222, "loss": 1.3118, "learning_rate": 9.98628141419305e-07, "epoch": 0.20270270270270271, "percentage": 6.76, "elapsed_time": "0:03:20", "remaining_time": "0:46:07"}
{"current_steps": 20, "total_steps": 222, "loss": 1.1295, "learning_rate": 9.94520093661082e-07, "epoch": 0.2702702702702703, "percentage": 9.01, "elapsed_time": "0:04:25", "remaining_time": "0:44:40"}
{"current_steps": 25, "total_steps": 222, "loss": 1.1044, "learning_rate": 9.876983993675989e-07, "epoch": 0.33783783783783783, "percentage": 11.26, "elapsed_time": "0:05:31", "remaining_time": "0:43:29"}
{"current_steps": 30, "total_steps": 222, "loss": 1.0105, "learning_rate": 9.78200492138261e-07, "epoch": 0.40540540540540543, "percentage": 13.51, "elapsed_time": "0:06:36", "remaining_time": "0:42:16"}
{"current_steps": 35, "total_steps": 222, "loss": 0.991, "learning_rate": 9.66078491115194e-07, "epoch": 0.47297297297297297, "percentage": 15.77, "elapsed_time": "0:07:41", "remaining_time": "0:41:05"}
{"current_steps": 40, "total_steps": 222, "loss": 0.9674, "learning_rate": 9.513989149828717e-07, "epoch": 0.5405405405405406, "percentage": 18.02, "elapsed_time": "0:08:46", "remaining_time": "0:39:57"}
{"current_steps": 45, "total_steps": 222, "loss": 0.9507, "learning_rate": 9.342423169512071e-07, "epoch": 0.6081081081081081, "percentage": 20.27, "elapsed_time": "0:09:51", "remaining_time": "0:38:46"}
{"current_steps": 50, "total_steps": 222, "loss": 0.9386, "learning_rate": 9.147028427251009e-07, "epoch": 0.6756756756756757, "percentage": 22.52, "elapsed_time": "0:10:57", "remaining_time": "0:37:41"}
{"current_steps": 50, "total_steps": 222, "eval_loss": 0.9245508313179016, "epoch": 0.6756756756756757, "percentage": 22.52, "elapsed_time": "0:11:34", "remaining_time": "0:39:47"}
{"current_steps": 55, "total_steps": 222, "loss": 0.946, "learning_rate": 8.928877138860706e-07, "epoch": 0.7432432432432432, "percentage": 24.77, "elapsed_time": "0:12:39", "remaining_time": "0:38:27"}
{"current_steps": 60, "total_steps": 222, "loss": 0.9186, "learning_rate": 8.689166395208636e-07, "epoch": 0.8108108108108109, "percentage": 27.03, "elapsed_time": "0:13:45", "remaining_time": "0:37:08"}
{"current_steps": 65, "total_steps": 222, "loss": 0.9203, "learning_rate": 8.429211593257052e-07, "epoch": 0.8783783783783784, "percentage": 29.28, "elapsed_time": "0:14:49", "remaining_time": "0:35:49"}
{"current_steps": 70, "total_steps": 222, "loss": 0.9104, "learning_rate": 8.150439217908556e-07, "epoch": 0.9459459459459459, "percentage": 31.53, "elapsed_time": "0:15:55", "remaining_time": "0:34:34"}
{"current_steps": 75, "total_steps": 222, "loss": 0.8925, "learning_rate": 7.854379014263876e-07, "epoch": 1.0135135135135136, "percentage": 33.78, "elapsed_time": "0:17:01", "remaining_time": "0:33:21"}
{"current_steps": 80, "total_steps": 222, "loss": 0.8628, "learning_rate": 7.542655593246103e-07, "epoch": 1.0810810810810811, "percentage": 36.04, "elapsed_time": "0:18:06", "remaining_time": "0:32:09"}
{"current_steps": 85, "total_steps": 222, "loss": 0.8289, "learning_rate": 7.216979516654943e-07, "epoch": 1.1486486486486487, "percentage": 38.29, "elapsed_time": "0:19:12", "remaining_time": "0:30:57"}
{"current_steps": 90, "total_steps": 222, "loss": 0.8346, "learning_rate": 6.87913791057119e-07, "epoch": 1.2162162162162162, "percentage": 40.54, "elapsed_time": "0:20:18", "remaining_time": "0:29:46"}
{"current_steps": 95, "total_steps": 222, "loss": 0.8442, "learning_rate": 6.530984658619733e-07, "epoch": 1.2837837837837838, "percentage": 42.79, "elapsed_time": "0:21:24", "remaining_time": "0:28:36"}
{"current_steps": 100, "total_steps": 222, "loss": 0.8263, "learning_rate": 6.174430228904919e-07, "epoch": 1.3513513513513513, "percentage": 45.05, "elapsed_time": "0:22:30", "remaining_time": "0:27:27"}
{"current_steps": 100, "total_steps": 222, "eval_loss": 0.8765044808387756, "epoch": 1.3513513513513513, "percentage": 45.05, "elapsed_time": "0:23:06", "remaining_time": "0:28:11"}
{"current_steps": 105, "total_steps": 222, "loss": 0.8266, "learning_rate": 5.8114311904423e-07, "epoch": 1.4189189189189189, "percentage": 47.3, "elapsed_time": "0:24:11", "remaining_time": "0:26:57"}
{"current_steps": 110, "total_steps": 222, "loss": 0.8094, "learning_rate": 5.443979476614674e-07, "epoch": 1.4864864864864864, "percentage": 49.55, "elapsed_time": "0:25:17", "remaining_time": "0:25:45"}
{"current_steps": 115, "total_steps": 222, "loss": 0.8107, "learning_rate": 5.074091454568463e-07, "epoch": 1.554054054054054, "percentage": 51.8, "elapsed_time": "0:26:23", "remaining_time": "0:24:33"}
{"current_steps": 120, "total_steps": 222, "loss": 0.8112, "learning_rate": 4.703796860531429e-07, "epoch": 1.6216216216216215, "percentage": 54.05, "elapsed_time": "0:27:28", "remaining_time": "0:23:21"}
{"current_steps": 125, "total_steps": 222, "loss": 0.8197, "learning_rate": 4.3351276617684285e-07, "epoch": 1.689189189189189, "percentage": 56.31, "elapsed_time": "0:28:34", "remaining_time": "0:22:10"}
{"current_steps": 130, "total_steps": 222, "loss": 0.8158, "learning_rate": 3.970106906294509e-07, "epoch": 1.7567567567567568, "percentage": 58.56, "elapsed_time": "0:29:40", "remaining_time": "0:21:00"}
{"current_steps": 135, "total_steps": 222, "loss": 0.8297, "learning_rate": 3.610737621531781e-07, "epoch": 1.8243243243243243, "percentage": 60.81, "elapsed_time": "0:30:46", "remaining_time": "0:19:50"}
{"current_steps": 140, "total_steps": 222, "loss": 0.8031, "learning_rate": 3.2589918228280066e-07, "epoch": 1.8918918918918919, "percentage": 63.06, "elapsed_time": "0:31:51", "remaining_time": "0:18:39"}
{"current_steps": 145, "total_steps": 222, "loss": 0.8016, "learning_rate": 2.916799692151884e-07, "epoch": 1.9594594594594594, "percentage": 65.32, "elapsed_time": "0:32:56", "remaining_time": "0:17:29"}
{"current_steps": 150, "total_steps": 222, "loss": 0.7963, "learning_rate": 2.5860389863462763e-07, "epoch": 2.027027027027027, "percentage": 67.57, "elapsed_time": "0:34:01", "remaining_time": "0:16:19"}
{"current_steps": 150, "total_steps": 222, "eval_loss": 0.8589270710945129, "epoch": 2.027027027027027, "percentage": 67.57, "elapsed_time": "0:34:38", "remaining_time": "0:16:37"}
{"current_steps": 155, "total_steps": 222, "loss": 0.7712, "learning_rate": 2.2685247330608414e-07, "epoch": 2.0945945945945947, "percentage": 69.82, "elapsed_time": "0:35:43", "remaining_time": "0:15:26"}
{"current_steps": 160, "total_steps": 222, "loss": 0.7662, "learning_rate": 1.9659992709070344e-07, "epoch": 2.1621621621621623, "percentage": 72.07, "elapsed_time": "0:36:48", "remaining_time": "0:14:15"}
{"current_steps": 165, "total_steps": 222, "loss": 0.7538, "learning_rate": 1.6801226884893893e-07, "epoch": 2.22972972972973, "percentage": 74.32, "elapsed_time": "0:37:53", "remaining_time": "0:13:05"}
{"current_steps": 170, "total_steps": 222, "loss": 0.7731, "learning_rate": 1.412463714778343e-07, "epoch": 2.2972972972972974, "percentage": 76.58, "elapsed_time": "0:38:58", "remaining_time": "0:11:55"}
{"current_steps": 175, "total_steps": 222, "loss": 0.7792, "learning_rate": 1.1644911108130434e-07, "epoch": 2.364864864864865, "percentage": 78.83, "elapsed_time": "0:40:04", "remaining_time": "0:10:45"}
{"current_steps": 180, "total_steps": 222, "loss": 0.757, "learning_rate": 9.375656099715934e-08, "epoch": 2.4324324324324325, "percentage": 81.08, "elapsed_time": "0:41:10", "remaining_time": "0:09:36"}
{"current_steps": 185, "total_steps": 222, "loss": 0.7426, "learning_rate": 7.329324510360269e-08, "epoch": 2.5, "percentage": 83.33, "elapsed_time": "0:42:15", "remaining_time": "0:08:27"}
{"current_steps": 190, "total_steps": 222, "loss": 0.754, "learning_rate": 5.517145450262639e-08, "epoch": 2.5675675675675675, "percentage": 85.59, "elapsed_time": "0:43:22", "remaining_time": "0:07:18"}
{"current_steps": 195, "total_steps": 222, "loss": 0.7604, "learning_rate": 3.9490631329964554e-08, "epoch": 2.635135135135135, "percentage": 87.84, "elapsed_time": "0:44:27", "remaining_time": "0:06:09"}
{"current_steps": 200, "total_steps": 222, "loss": 0.7574, "learning_rate": 2.63368230729043e-08, "epoch": 2.7027027027027026, "percentage": 90.09, "elapsed_time": "0:45:33", "remaining_time": "0:05:00"}
{"current_steps": 200, "total_steps": 222, "eval_loss": 0.8600885272026062, "epoch": 2.7027027027027026, "percentage": 90.09, "elapsed_time": "0:46:10", "remaining_time": "0:05:04"}
{"current_steps": 205, "total_steps": 222, "loss": 0.7485, "learning_rate": 1.5782210390350713e-08, "epoch": 2.77027027027027, "percentage": 92.34, "elapsed_time": "0:47:15", "remaining_time": "0:03:55"}
{"current_steps": 210, "total_steps": 222, "loss": 0.7526, "learning_rate": 7.884711026201584e-09, "epoch": 2.8378378378378377, "percentage": 94.59, "elapsed_time": "0:48:21", "remaining_time": "0:02:45"}
{"current_steps": 215, "total_steps": 222, "loss": 0.7473, "learning_rate": 2.687661989531964e-09, "epoch": 2.9054054054054053, "percentage": 96.85, "elapsed_time": "0:49:27", "remaining_time": "0:01:36"}
{"current_steps": 220, "total_steps": 222, "loss": 0.7482, "learning_rate": 2.1958174560282594e-10, "epoch": 2.972972972972973, "percentage": 99.1, "elapsed_time": "0:50:32", "remaining_time": "0:00:27"}
{"current_steps": 222, "total_steps": 222, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "0:51:30", "remaining_time": "0:00:00"}