sedrickkeh commited on
Commit
b3526e8
·
verified ·
1 Parent(s): 3aca715

Training in progress, epoch 2

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5530940438d0305c4152fbf1f4cc2489aa44f5697b4db134d4200155410ec8d9
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:821b1d143c18e550e7ca59cbd23227d1f5ded0f07a47792dcb59b2e2d7b82e29
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bc81b2ac672ce52f29f38d321e8af2021ac911bf3c662edf149e1a6d97ae2840
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a77672f48ffaef6eddd8c48d4c5f6d2bbe0b5c3fc73de9d5dfc745d52225a165
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9d6827660fcbaec1a7148d2f028754c0f2e720adf7af932eed642acb23617999
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:05532e623e97c3cb7f68a7fdee1f916090db471d0fa756fe84fa96777a397c3c
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d5c2f9a89e38f1603006efd5756af2d9543cd5f257db1e9268cb798461256e2a
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:97206f85f760aaf6378d311e88eef0a129de674766e3f7044f543b590de3b7d0
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -221,3 +221,114 @@
221
  {"current_steps": 221, "total_steps": 333, "loss": 0.4413, "lr": 2.464413991568222e-05, "epoch": 1.9865168539325841, "percentage": 66.37, "elapsed_time": "5:59:34", "remaining_time": "3:02:13"}
222
  {"current_steps": 222, "total_steps": 333, "loss": 0.4383, "lr": 2.4256918192173088e-05, "epoch": 1.9955056179775281, "percentage": 66.67, "elapsed_time": "6:01:10", "remaining_time": "3:00:35"}
223
  {"current_steps": 223, "total_steps": 333, "loss": 0.7545, "lr": 2.3871434442065414e-05, "epoch": 2.004494382022472, "percentage": 66.97, "elapsed_time": "6:04:22", "remaining_time": "2:59:44"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
221
  {"current_steps": 221, "total_steps": 333, "loss": 0.4413, "lr": 2.464413991568222e-05, "epoch": 1.9865168539325841, "percentage": 66.37, "elapsed_time": "5:59:34", "remaining_time": "3:02:13"}
222
  {"current_steps": 222, "total_steps": 333, "loss": 0.4383, "lr": 2.4256918192173088e-05, "epoch": 1.9955056179775281, "percentage": 66.67, "elapsed_time": "6:01:10", "remaining_time": "3:00:35"}
223
  {"current_steps": 223, "total_steps": 333, "loss": 0.7545, "lr": 2.3871434442065414e-05, "epoch": 2.004494382022472, "percentage": 66.97, "elapsed_time": "6:04:22", "remaining_time": "2:59:44"}
224
+ {"current_steps": 224, "total_steps": 333, "loss": 0.4154, "lr": 2.3487731221226754e-05, "epoch": 2.013483146067416, "percentage": 67.27, "elapsed_time": "6:05:58", "remaining_time": "2:58:05"}
225
+ {"current_steps": 225, "total_steps": 333, "loss": 0.4165, "lr": 2.3105850888961348e-05, "epoch": 2.0224719101123596, "percentage": 67.57, "elapsed_time": "6:07:35", "remaining_time": "2:56:26"}
226
+ {"current_steps": 226, "total_steps": 333, "loss": 0.4141, "lr": 2.272583560333379e-05, "epoch": 2.0314606741573034, "percentage": 67.87, "elapsed_time": "6:09:12", "remaining_time": "2:54:48"}
227
+ {"current_steps": 227, "total_steps": 333, "loss": 0.4173, "lr": 2.2347727316515e-05, "epoch": 2.040449438202247, "percentage": 68.17, "elapsed_time": "6:10:50", "remaining_time": "2:53:09"}
228
+ {"current_steps": 228, "total_steps": 333, "loss": 0.4039, "lr": 2.1971567770150814e-05, "epoch": 2.049438202247191, "percentage": 68.47, "elapsed_time": "6:12:26", "remaining_time": "2:51:31"}
229
+ {"current_steps": 229, "total_steps": 333, "loss": 0.4126, "lr": 2.1597398490753917e-05, "epoch": 2.0584269662921346, "percentage": 68.77, "elapsed_time": "6:14:03", "remaining_time": "2:49:52"}
230
+ {"current_steps": 230, "total_steps": 333, "loss": 0.4112, "lr": 2.1225260785119456e-05, "epoch": 2.067415730337079, "percentage": 69.07, "elapsed_time": "6:15:41", "remaining_time": "2:48:14"}
231
+ {"current_steps": 231, "total_steps": 333, "loss": 0.4136, "lr": 2.0855195735764947e-05, "epoch": 2.0764044943820226, "percentage": 69.37, "elapsed_time": "6:17:18", "remaining_time": "2:46:36"}
232
+ {"current_steps": 232, "total_steps": 333, "loss": 0.4158, "lr": 2.0487244196394912e-05, "epoch": 2.0853932584269663, "percentage": 69.67, "elapsed_time": "6:18:55", "remaining_time": "2:44:57"}
233
+ {"current_steps": 233, "total_steps": 333, "loss": 0.414, "lr": 2.0121446787390822e-05, "epoch": 2.09438202247191, "percentage": 69.97, "elapsed_time": "6:20:32", "remaining_time": "2:43:19"}
234
+ {"current_steps": 234, "total_steps": 333, "loss": 0.409, "lr": 1.9757843891326736e-05, "epoch": 2.103370786516854, "percentage": 70.27, "elapsed_time": "6:22:09", "remaining_time": "2:41:40"}
235
+ {"current_steps": 235, "total_steps": 333, "loss": 0.4118, "lr": 1.939647564851127e-05, "epoch": 2.1123595505617976, "percentage": 70.57, "elapsed_time": "6:23:46", "remaining_time": "2:40:02"}
236
+ {"current_steps": 236, "total_steps": 333, "loss": 0.4082, "lr": 1.9037381952556217e-05, "epoch": 2.121348314606742, "percentage": 70.87, "elapsed_time": "6:25:23", "remaining_time": "2:38:24"}
237
+ {"current_steps": 237, "total_steps": 333, "loss": 0.4208, "lr": 1.8680602445972463e-05, "epoch": 2.1303370786516855, "percentage": 71.17, "elapsed_time": "6:27:00", "remaining_time": "2:36:45"}
238
+ {"current_steps": 238, "total_steps": 333, "loss": 0.4143, "lr": 1.832617651579365e-05, "epoch": 2.1393258426966293, "percentage": 71.47, "elapsed_time": "6:28:38", "remaining_time": "2:35:07"}
239
+ {"current_steps": 239, "total_steps": 333, "loss": 0.4126, "lr": 1.797414328922797e-05, "epoch": 2.148314606741573, "percentage": 71.77, "elapsed_time": "6:30:15", "remaining_time": "2:33:29"}
240
+ {"current_steps": 240, "total_steps": 333, "loss": 0.4107, "lr": 1.7624541629338676e-05, "epoch": 2.157303370786517, "percentage": 72.07, "elapsed_time": "6:31:52", "remaining_time": "2:31:51"}
241
+ {"current_steps": 241, "total_steps": 333, "loss": 0.4147, "lr": 1.7277410130753775e-05, "epoch": 2.1662921348314605, "percentage": 72.37, "elapsed_time": "6:33:30", "remaining_time": "2:30:13"}
242
+ {"current_steps": 242, "total_steps": 333, "loss": 0.4079, "lr": 1.6932787115405318e-05, "epoch": 2.1752808988764043, "percentage": 72.67, "elapsed_time": "6:35:07", "remaining_time": "2:28:34"}
243
+ {"current_steps": 243, "total_steps": 333, "loss": 0.41, "lr": 1.6590710628298826e-05, "epoch": 2.1842696629213485, "percentage": 72.97, "elapsed_time": "6:36:44", "remaining_time": "2:26:56"}
244
+ {"current_steps": 244, "total_steps": 333, "loss": 0.4091, "lr": 1.6251218433313254e-05, "epoch": 2.1932584269662923, "percentage": 73.27, "elapsed_time": "6:38:21", "remaining_time": "2:25:18"}
245
+ {"current_steps": 245, "total_steps": 333, "loss": 0.408, "lr": 1.591434800903203e-05, "epoch": 2.202247191011236, "percentage": 73.57, "elapsed_time": "6:39:59", "remaining_time": "2:23:40"}
246
+ {"current_steps": 246, "total_steps": 333, "loss": 0.409, "lr": 1.558013654460555e-05, "epoch": 2.2112359550561798, "percentage": 73.87, "elapsed_time": "6:41:36", "remaining_time": "2:22:01"}
247
+ {"current_steps": 247, "total_steps": 333, "loss": 0.4108, "lr": 1.5248620935645666e-05, "epoch": 2.2202247191011235, "percentage": 74.17, "elapsed_time": "6:43:13", "remaining_time": "2:20:23"}
248
+ {"current_steps": 248, "total_steps": 333, "loss": 0.4086, "lr": 1.4919837780152544e-05, "epoch": 2.2292134831460673, "percentage": 74.47, "elapsed_time": "6:44:50", "remaining_time": "2:18:45"}
249
+ {"current_steps": 249, "total_steps": 333, "loss": 0.4134, "lr": 1.4593823374474374e-05, "epoch": 2.238202247191011, "percentage": 74.77, "elapsed_time": "6:46:27", "remaining_time": "2:17:07"}
250
+ {"current_steps": 250, "total_steps": 333, "loss": 0.4105, "lr": 1.4270613709300429e-05, "epoch": 2.247191011235955, "percentage": 75.08, "elapsed_time": "6:48:04", "remaining_time": "2:15:29"}
251
+ {"current_steps": 251, "total_steps": 333, "loss": 0.4113, "lr": 1.3950244465687833e-05, "epoch": 2.256179775280899, "percentage": 75.38, "elapsed_time": "6:49:42", "remaining_time": "2:13:50"}
252
+ {"current_steps": 252, "total_steps": 333, "loss": 0.4117, "lr": 1.3632751011122497e-05, "epoch": 2.2651685393258427, "percentage": 75.68, "elapsed_time": "6:51:19", "remaining_time": "2:12:12"}
253
+ {"current_steps": 253, "total_steps": 333, "loss": 0.4086, "lr": 1.3318168395614697e-05, "epoch": 2.2741573033707865, "percentage": 75.98, "elapsed_time": "6:52:56", "remaining_time": "2:10:34"}
254
+ {"current_steps": 254, "total_steps": 333, "loss": 0.4075, "lr": 1.3006531347829699e-05, "epoch": 2.2831460674157302, "percentage": 76.28, "elapsed_time": "6:54:33", "remaining_time": "2:08:56"}
255
+ {"current_steps": 255, "total_steps": 333, "loss": 0.4092, "lr": 1.2697874271253844e-05, "epoch": 2.292134831460674, "percentage": 76.58, "elapsed_time": "6:56:10", "remaining_time": "2:07:18"}
256
+ {"current_steps": 256, "total_steps": 333, "loss": 0.4103, "lr": 1.2392231240396542e-05, "epoch": 2.3011235955056177, "percentage": 76.88, "elapsed_time": "6:57:48", "remaining_time": "2:05:40"}
257
+ {"current_steps": 257, "total_steps": 333, "loss": 0.4165, "lr": 1.2089635997028592e-05, "epoch": 2.310112359550562, "percentage": 77.18, "elapsed_time": "6:59:25", "remaining_time": "2:04:01"}
258
+ {"current_steps": 258, "total_steps": 333, "loss": 0.4166, "lr": 1.1790121946457212e-05, "epoch": 2.3191011235955057, "percentage": 77.48, "elapsed_time": "7:01:02", "remaining_time": "2:02:23"}
259
+ {"current_steps": 259, "total_steps": 333, "loss": 0.407, "lr": 1.1493722153838239e-05, "epoch": 2.3280898876404494, "percentage": 77.78, "elapsed_time": "7:02:39", "remaining_time": "2:00:45"}
260
+ {"current_steps": 260, "total_steps": 333, "loss": 0.413, "lr": 1.120046934052585e-05, "epoch": 2.337078651685393, "percentage": 78.08, "elapsed_time": "7:04:17", "remaining_time": "1:59:07"}
261
+ {"current_steps": 261, "total_steps": 333, "loss": 0.4112, "lr": 1.0910395880460274e-05, "epoch": 2.346067415730337, "percentage": 78.38, "elapsed_time": "7:05:53", "remaining_time": "1:57:29"}
262
+ {"current_steps": 262, "total_steps": 333, "loss": 0.4182, "lr": 1.062353379659383e-05, "epoch": 2.355056179775281, "percentage": 78.68, "elapsed_time": "7:07:30", "remaining_time": "1:55:51"}
263
+ {"current_steps": 263, "total_steps": 333, "loss": 0.4058, "lr": 1.0339914757355718e-05, "epoch": 2.364044943820225, "percentage": 78.98, "elapsed_time": "7:09:08", "remaining_time": "1:54:13"}
264
+ {"current_steps": 264, "total_steps": 333, "loss": 0.4224, "lr": 1.0059570073155953e-05, "epoch": 2.3730337078651687, "percentage": 79.28, "elapsed_time": "7:10:45", "remaining_time": "1:52:35"}
265
+ {"current_steps": 265, "total_steps": 333, "loss": 0.4175, "lr": 9.782530692928832e-06, "epoch": 2.3820224719101124, "percentage": 79.58, "elapsed_time": "7:12:22", "remaining_time": "1:50:56"}
266
+ {"current_steps": 266, "total_steps": 333, "loss": 0.4087, "lr": 9.508827200716273e-06, "epoch": 2.391011235955056, "percentage": 79.88, "elapsed_time": "7:13:59", "remaining_time": "1:49:18"}
267
+ {"current_steps": 267, "total_steps": 333, "loss": 0.4081, "lr": 9.238489812291469e-06, "epoch": 2.4, "percentage": 80.18, "elapsed_time": "7:15:36", "remaining_time": "1:47:40"}
268
+ {"current_steps": 268, "total_steps": 333, "loss": 0.4082, "lr": 8.971548371823205e-06, "epoch": 2.4089887640449437, "percentage": 80.48, "elapsed_time": "7:17:13", "remaining_time": "1:46:02"}
269
+ {"current_steps": 269, "total_steps": 333, "loss": 0.4073, "lr": 8.708032348581144e-06, "epoch": 2.417977528089888, "percentage": 80.78, "elapsed_time": "7:18:50", "remaining_time": "1:44:24"}
270
+ {"current_steps": 270, "total_steps": 333, "loss": 0.4113, "lr": 8.447970833682584e-06, "epoch": 2.4269662921348316, "percentage": 81.08, "elapsed_time": "7:20:26", "remaining_time": "1:42:46"}
271
+ {"current_steps": 271, "total_steps": 333, "loss": 0.4071, "lr": 8.191392536880852e-06, "epoch": 2.4359550561797754, "percentage": 81.38, "elapsed_time": "7:22:03", "remaining_time": "1:41:08"}
272
+ {"current_steps": 272, "total_steps": 333, "loss": 0.4019, "lr": 7.938325783395924e-06, "epoch": 2.444943820224719, "percentage": 81.68, "elapsed_time": "7:23:41", "remaining_time": "1:39:30"}
273
+ {"current_steps": 273, "total_steps": 333, "loss": 0.4116, "lr": 7.68879851078741e-06, "epoch": 2.453932584269663, "percentage": 81.98, "elapsed_time": "7:25:17", "remaining_time": "1:37:52"}
274
+ {"current_steps": 274, "total_steps": 333, "loss": 0.4097, "lr": 7.442838265870347e-06, "epoch": 2.4629213483146066, "percentage": 82.28, "elapsed_time": "7:26:54", "remaining_time": "1:36:14"}
275
+ {"current_steps": 275, "total_steps": 333, "loss": 0.4086, "lr": 7.2004722016741605e-06, "epoch": 2.4719101123595504, "percentage": 82.58, "elapsed_time": "7:28:32", "remaining_time": "1:34:36"}
276
+ {"current_steps": 276, "total_steps": 333, "loss": 0.4048, "lr": 6.961727074445055e-06, "epoch": 2.4808988764044946, "percentage": 82.88, "elapsed_time": "7:30:09", "remaining_time": "1:32:57"}
277
+ {"current_steps": 277, "total_steps": 333, "loss": 0.406, "lr": 6.726629240692255e-06, "epoch": 2.4898876404494383, "percentage": 83.18, "elapsed_time": "7:31:46", "remaining_time": "1:31:19"}
278
+ {"current_steps": 278, "total_steps": 333, "loss": 0.4084, "lr": 6.4952046542783395e-06, "epoch": 2.498876404494382, "percentage": 83.48, "elapsed_time": "7:33:22", "remaining_time": "1:29:41"}
279
+ {"current_steps": 279, "total_steps": 333, "loss": 0.4088, "lr": 6.2674788635540415e-06, "epoch": 2.507865168539326, "percentage": 83.78, "elapsed_time": "7:34:59", "remaining_time": "1:28:03"}
280
+ {"current_steps": 280, "total_steps": 333, "loss": 0.4091, "lr": 6.04347700853781e-06, "epoch": 2.5168539325842696, "percentage": 84.08, "elapsed_time": "7:36:36", "remaining_time": "1:26:25"}
281
+ {"current_steps": 281, "total_steps": 333, "loss": 0.4135, "lr": 5.823223818140458e-06, "epoch": 2.5258426966292133, "percentage": 84.38, "elapsed_time": "7:38:13", "remaining_time": "1:24:47"}
282
+ {"current_steps": 282, "total_steps": 333, "loss": 0.4192, "lr": 5.606743607435183e-06, "epoch": 2.534831460674157, "percentage": 84.68, "elapsed_time": "7:39:50", "remaining_time": "1:23:09"}
283
+ {"current_steps": 283, "total_steps": 333, "loss": 0.4143, "lr": 5.394060274973267e-06, "epoch": 2.5438202247191013, "percentage": 84.98, "elapsed_time": "7:41:27", "remaining_time": "1:21:31"}
284
+ {"current_steps": 284, "total_steps": 333, "loss": 0.4073, "lr": 5.185197300145817e-06, "epoch": 2.552808988764045, "percentage": 85.29, "elapsed_time": "7:43:04", "remaining_time": "1:19:53"}
285
+ {"current_steps": 285, "total_steps": 333, "loss": 0.408, "lr": 4.980177740591678e-06, "epoch": 2.561797752808989, "percentage": 85.59, "elapsed_time": "7:44:41", "remaining_time": "1:18:15"}
286
+ {"current_steps": 286, "total_steps": 333, "loss": 0.4086, "lr": 4.779024229652005e-06, "epoch": 2.5707865168539326, "percentage": 85.89, "elapsed_time": "7:46:18", "remaining_time": "1:16:37"}
287
+ {"current_steps": 287, "total_steps": 333, "loss": 0.4053, "lr": 4.581758973871609e-06, "epoch": 2.5797752808988763, "percentage": 86.19, "elapsed_time": "7:47:55", "remaining_time": "1:14:59"}
288
+ {"current_steps": 288, "total_steps": 333, "loss": 0.4051, "lr": 4.3884037505474455e-06, "epoch": 2.58876404494382, "percentage": 86.49, "elapsed_time": "7:49:32", "remaining_time": "1:13:21"}
289
+ {"current_steps": 289, "total_steps": 333, "loss": 0.4062, "lr": 4.198979905324496e-06, "epoch": 2.597752808988764, "percentage": 86.79, "elapsed_time": "7:51:09", "remaining_time": "1:11:43"}
290
+ {"current_steps": 290, "total_steps": 333, "loss": 0.4143, "lr": 4.0135083498392905e-06, "epoch": 2.606741573033708, "percentage": 87.09, "elapsed_time": "7:52:46", "remaining_time": "1:10:06"}
291
+ {"current_steps": 291, "total_steps": 333, "loss": 0.407, "lr": 3.832009559411338e-06, "epoch": 2.6157303370786518, "percentage": 87.39, "elapsed_time": "7:54:22", "remaining_time": "1:08:28"}
292
+ {"current_steps": 292, "total_steps": 333, "loss": 0.4094, "lr": 3.654503570782755e-06, "epoch": 2.6247191011235955, "percentage": 87.69, "elapsed_time": "7:55:59", "remaining_time": "1:06:50"}
293
+ {"current_steps": 293, "total_steps": 333, "loss": 0.408, "lr": 3.481009979906258e-06, "epoch": 2.6337078651685393, "percentage": 87.99, "elapsed_time": "7:57:36", "remaining_time": "1:05:12"}
294
+ {"current_steps": 294, "total_steps": 333, "loss": 0.4064, "lr": 3.311547939781887e-06, "epoch": 2.642696629213483, "percentage": 88.29, "elapsed_time": "7:59:13", "remaining_time": "1:03:34"}
295
+ {"current_steps": 295, "total_steps": 333, "loss": 0.4044, "lr": 3.14613615834253e-06, "epoch": 2.6516853932584272, "percentage": 88.59, "elapsed_time": "8:00:50", "remaining_time": "1:01:56"}
296
+ {"current_steps": 296, "total_steps": 333, "loss": 0.4054, "lr": 2.9847928963887198e-06, "epoch": 2.6606741573033705, "percentage": 88.89, "elapsed_time": "8:02:27", "remaining_time": "1:00:18"}
297
+ {"current_steps": 297, "total_steps": 333, "loss": 0.4065, "lr": 2.8275359655726586e-06, "epoch": 2.6696629213483147, "percentage": 89.19, "elapsed_time": "8:04:04", "remaining_time": "0:58:40"}
298
+ {"current_steps": 298, "total_steps": 333, "loss": 0.4027, "lr": 2.6743827264319012e-06, "epoch": 2.6786516853932585, "percentage": 89.49, "elapsed_time": "8:05:41", "remaining_time": "0:57:02"}
299
+ {"current_steps": 299, "total_steps": 333, "loss": 0.4048, "lr": 2.5253500864728155e-06, "epoch": 2.6876404494382022, "percentage": 89.79, "elapsed_time": "8:07:18", "remaining_time": "0:55:24"}
300
+ {"current_steps": 300, "total_steps": 333, "loss": 0.4025, "lr": 2.3804544983040724e-06, "epoch": 2.696629213483146, "percentage": 90.09, "elapsed_time": "8:08:55", "remaining_time": "0:53:46"}
301
+ {"current_steps": 301, "total_steps": 333, "loss": 0.406, "lr": 2.23971195782033e-06, "epoch": 2.7056179775280897, "percentage": 90.39, "elapsed_time": "8:10:32", "remaining_time": "0:52:09"}
302
+ {"current_steps": 302, "total_steps": 333, "loss": 0.4121, "lr": 2.1031380024363645e-06, "epoch": 2.714606741573034, "percentage": 90.69, "elapsed_time": "8:12:09", "remaining_time": "0:50:31"}
303
+ {"current_steps": 303, "total_steps": 333, "loss": 0.4083, "lr": 1.9707477093717786e-06, "epoch": 2.7235955056179773, "percentage": 90.99, "elapsed_time": "8:13:46", "remaining_time": "0:48:53"}
304
+ {"current_steps": 304, "total_steps": 333, "loss": 0.4146, "lr": 1.8425556939865696e-06, "epoch": 2.7325842696629215, "percentage": 91.29, "elapsed_time": "8:15:23", "remaining_time": "0:47:15"}
305
+ {"current_steps": 305, "total_steps": 333, "loss": 0.4076, "lr": 1.7185761081676222e-06, "epoch": 2.741573033707865, "percentage": 91.59, "elapsed_time": "8:17:00", "remaining_time": "0:45:37"}
306
+ {"current_steps": 306, "total_steps": 333, "loss": 0.4072, "lr": 1.5988226387664151e-06, "epoch": 2.750561797752809, "percentage": 91.89, "elapsed_time": "8:18:37", "remaining_time": "0:43:59"}
307
+ {"current_steps": 307, "total_steps": 333, "loss": 0.4116, "lr": 1.4833085060880349e-06, "epoch": 2.7595505617977527, "percentage": 92.19, "elapsed_time": "8:20:14", "remaining_time": "0:42:21"}
308
+ {"current_steps": 308, "total_steps": 333, "loss": 0.4028, "lr": 1.3720464624317108e-06, "epoch": 2.7685393258426965, "percentage": 92.49, "elapsed_time": "8:21:51", "remaining_time": "0:40:44"}
309
+ {"current_steps": 309, "total_steps": 333, "loss": 0.408, "lr": 1.2650487906830234e-06, "epoch": 2.7775280898876407, "percentage": 92.79, "elapsed_time": "8:23:28", "remaining_time": "0:39:06"}
310
+ {"current_steps": 310, "total_steps": 333, "loss": 0.4124, "lr": 1.1623273029579195e-06, "epoch": 2.7865168539325844, "percentage": 93.09, "elapsed_time": "8:25:05", "remaining_time": "0:37:28"}
311
+ {"current_steps": 311, "total_steps": 333, "loss": 0.4153, "lr": 1.063893339298674e-06, "epoch": 2.795505617977528, "percentage": 93.39, "elapsed_time": "8:26:42", "remaining_time": "0:35:50"}
312
+ {"current_steps": 312, "total_steps": 333, "loss": 0.4128, "lr": 9.697577664220303e-07, "epoch": 2.804494382022472, "percentage": 93.69, "elapsed_time": "8:28:19", "remaining_time": "0:34:12"}
313
+ {"current_steps": 313, "total_steps": 333, "loss": 0.4047, "lr": 8.799309765195452e-07, "epoch": 2.8134831460674157, "percentage": 93.99, "elapsed_time": "8:29:56", "remaining_time": "0:32:35"}
314
+ {"current_steps": 314, "total_steps": 333, "loss": 0.4035, "lr": 7.944228861103264e-07, "epoch": 2.8224719101123594, "percentage": 94.29, "elapsed_time": "8:31:33", "remaining_time": "0:30:57"}
315
+ {"current_steps": 315, "total_steps": 333, "loss": 0.4059, "lr": 7.132429349463011e-07, "epoch": 2.831460674157303, "percentage": 94.59, "elapsed_time": "8:33:09", "remaining_time": "0:29:19"}
316
+ {"current_steps": 316, "total_steps": 333, "loss": 0.4039, "lr": 6.364000849700791e-07, "epoch": 2.8404494382022474, "percentage": 94.89, "elapsed_time": "8:34:46", "remaining_time": "0:27:41"}
317
+ {"current_steps": 317, "total_steps": 333, "loss": 0.4067, "lr": 5.639028193256257e-07, "epoch": 2.849438202247191, "percentage": 95.2, "elapsed_time": "8:36:23", "remaining_time": "0:26:03"}
318
+ {"current_steps": 318, "total_steps": 333, "loss": 0.4077, "lr": 4.957591414217344e-07, "epoch": 2.858426966292135, "percentage": 95.5, "elapsed_time": "8:38:00", "remaining_time": "0:24:26"}
319
+ {"current_steps": 319, "total_steps": 333, "loss": 0.4163, "lr": 4.3197657404848935e-07, "epoch": 2.8674157303370786, "percentage": 95.8, "elapsed_time": "8:39:37", "remaining_time": "0:22:48"}
320
+ {"current_steps": 320, "total_steps": 333, "loss": 0.4074, "lr": 3.725621585467698e-07, "epoch": 2.8764044943820224, "percentage": 96.1, "elapsed_time": "8:41:14", "remaining_time": "0:21:10"}
321
+ {"current_steps": 321, "total_steps": 333, "loss": 0.4047, "lr": 3.1752245403092963e-07, "epoch": 2.885393258426966, "percentage": 96.4, "elapsed_time": "8:42:51", "remaining_time": "0:19:32"}
322
+ {"current_steps": 322, "total_steps": 333, "loss": 0.4015, "lr": 2.6686353666468323e-07, "epoch": 2.89438202247191, "percentage": 96.7, "elapsed_time": "8:44:28", "remaining_time": "0:17:55"}
323
+ {"current_steps": 323, "total_steps": 333, "loss": 0.4007, "lr": 2.2059099899033098e-07, "epoch": 2.903370786516854, "percentage": 97.0, "elapsed_time": "8:46:05", "remaining_time": "0:16:17"}
324
+ {"current_steps": 324, "total_steps": 333, "loss": 0.4088, "lr": 1.7870994931135977e-07, "epoch": 2.912359550561798, "percentage": 97.3, "elapsed_time": "8:47:42", "remaining_time": "0:14:39"}
325
+ {"current_steps": 325, "total_steps": 333, "loss": 0.4081, "lr": 1.412250111285074e-07, "epoch": 2.9213483146067416, "percentage": 97.6, "elapsed_time": "8:49:20", "remaining_time": "0:13:01"}
326
+ {"current_steps": 326, "total_steps": 333, "loss": 0.4079, "lr": 1.0814032262935315e-07, "epoch": 2.9303370786516854, "percentage": 97.9, "elapsed_time": "8:50:56", "remaining_time": "0:11:24"}
327
+ {"current_steps": 327, "total_steps": 333, "loss": 0.4076, "lr": 7.945953623146096e-08, "epoch": 2.939325842696629, "percentage": 98.2, "elapsed_time": "8:52:33", "remaining_time": "0:09:46"}
328
+ {"current_steps": 328, "total_steps": 333, "loss": 0.4127, "lr": 5.518581817918645e-08, "epoch": 2.9483146067415733, "percentage": 98.5, "elapsed_time": "8:54:10", "remaining_time": "0:08:08"}
329
+ {"current_steps": 329, "total_steps": 333, "loss": 0.4074, "lr": 3.532184819412532e-08, "epoch": 2.9573033707865166, "percentage": 98.8, "elapsed_time": "8:55:47", "remaining_time": "0:06:30"}
330
+ {"current_steps": 330, "total_steps": 333, "loss": 0.4099, "lr": 1.9869819179292315e-08, "epoch": 2.966292134831461, "percentage": 99.1, "elapsed_time": "8:57:24", "remaining_time": "0:04:53"}
331
+ {"current_steps": 331, "total_steps": 333, "loss": 0.4092, "lr": 8.83143697702149e-09, "epoch": 2.9752808988764046, "percentage": 99.4, "elapsed_time": "8:59:01", "remaining_time": "0:03:15"}
332
+ {"current_steps": 332, "total_steps": 333, "loss": 0.4106, "lr": 2.2079201806501916e-09, "epoch": 2.9842696629213483, "percentage": 99.7, "elapsed_time": "9:00:38", "remaining_time": "0:01:37"}
333
+ {"current_steps": 333, "total_steps": 333, "loss": 0.4064, "lr": 0.0, "epoch": 2.993258426966292, "percentage": 100.0, "elapsed_time": "9:02:15", "remaining_time": "0:00:00"}
334
+ {"current_steps": 333, "total_steps": 333, "epoch": 2.993258426966292, "percentage": 100.0, "elapsed_time": "9:03:44", "remaining_time": "0:00:00"}