htlou's picture
Upload folder using huggingface_hub
122ae77 verified
raw
history blame
14.7 kB
{"current_steps": 5, "total_steps": 330, "loss": 1.7371, "learning_rate": 5e-07, "epoch": 0.045146726862302484, "percentage": 1.52, "elapsed_time": "0:01:09", "remaining_time": "1:15:20"}
{"current_steps": 10, "total_steps": 330, "loss": 1.6227, "learning_rate": 1e-06, "epoch": 0.09029345372460497, "percentage": 3.03, "elapsed_time": "0:02:15", "remaining_time": "1:12:04"}
{"current_steps": 15, "total_steps": 330, "loss": 1.2966, "learning_rate": 9.993977281025862e-07, "epoch": 0.13544018058690746, "percentage": 4.55, "elapsed_time": "0:03:19", "remaining_time": "1:09:48"}
{"current_steps": 20, "total_steps": 330, "loss": 1.1552, "learning_rate": 9.975923633360984e-07, "epoch": 0.18058690744920994, "percentage": 6.06, "elapsed_time": "0:04:24", "remaining_time": "1:08:22"}
{"current_steps": 25, "total_steps": 330, "loss": 1.0619, "learning_rate": 9.945882549823904e-07, "epoch": 0.22573363431151242, "percentage": 7.58, "elapsed_time": "0:05:29", "remaining_time": "1:07:00"}
{"current_steps": 30, "total_steps": 330, "loss": 1.0028, "learning_rate": 9.90392640201615e-07, "epoch": 0.2708803611738149, "percentage": 9.09, "elapsed_time": "0:06:34", "remaining_time": "1:05:47"}
{"current_steps": 35, "total_steps": 330, "loss": 1.0079, "learning_rate": 9.85015626597272e-07, "epoch": 0.3160270880361174, "percentage": 10.61, "elapsed_time": "0:07:40", "remaining_time": "1:04:42"}
{"current_steps": 40, "total_steps": 330, "loss": 0.971, "learning_rate": 9.784701678661044e-07, "epoch": 0.3611738148984199, "percentage": 12.12, "elapsed_time": "0:08:46", "remaining_time": "1:03:36"}
{"current_steps": 45, "total_steps": 330, "loss": 0.9516, "learning_rate": 9.707720325915103e-07, "epoch": 0.40632054176072235, "percentage": 13.64, "elapsed_time": "0:09:52", "remaining_time": "1:02:29"}
{"current_steps": 50, "total_steps": 330, "loss": 0.9534, "learning_rate": 9.619397662556433e-07, "epoch": 0.45146726862302483, "percentage": 15.15, "elapsed_time": "0:10:57", "remaining_time": "1:01:23"}
{"current_steps": 50, "total_steps": 330, "eval_loss": 0.9350618124008179, "epoch": 0.45146726862302483, "percentage": 15.15, "elapsed_time": "0:11:53", "remaining_time": "1:06:36"}
{"current_steps": 55, "total_steps": 330, "loss": 0.9279, "learning_rate": 9.519946465617217e-07, "epoch": 0.4966139954853273, "percentage": 16.67, "elapsed_time": "0:12:59", "remaining_time": "1:04:55"}
{"current_steps": 60, "total_steps": 330, "loss": 0.9373, "learning_rate": 9.409606321741774e-07, "epoch": 0.5417607223476298, "percentage": 18.18, "elapsed_time": "0:14:04", "remaining_time": "1:03:20"}
{"current_steps": 65, "total_steps": 330, "loss": 0.9134, "learning_rate": 9.28864305000136e-07, "epoch": 0.5869074492099323, "percentage": 19.7, "elapsed_time": "0:15:09", "remaining_time": "1:01:49"}
{"current_steps": 70, "total_steps": 330, "loss": 0.8902, "learning_rate": 9.157348061512726e-07, "epoch": 0.6320541760722348, "percentage": 21.21, "elapsed_time": "0:16:15", "remaining_time": "1:00:23"}
{"current_steps": 75, "total_steps": 330, "loss": 0.8907, "learning_rate": 9.016037657403223e-07, "epoch": 0.6772009029345373, "percentage": 22.73, "elapsed_time": "0:17:20", "remaining_time": "0:58:59"}
{"current_steps": 80, "total_steps": 330, "loss": 0.8798, "learning_rate": 8.865052266813685e-07, "epoch": 0.7223476297968398, "percentage": 24.24, "elapsed_time": "0:18:26", "remaining_time": "0:57:38"}
{"current_steps": 85, "total_steps": 330, "loss": 0.8873, "learning_rate": 8.704755626774795e-07, "epoch": 0.7674943566591422, "percentage": 25.76, "elapsed_time": "0:19:31", "remaining_time": "0:56:17"}
{"current_steps": 90, "total_steps": 330, "loss": 0.8951, "learning_rate": 8.535533905932737e-07, "epoch": 0.8126410835214447, "percentage": 27.27, "elapsed_time": "0:20:37", "remaining_time": "0:54:59"}
{"current_steps": 95, "total_steps": 330, "loss": 0.8813, "learning_rate": 8.357794774235092e-07, "epoch": 0.8577878103837472, "percentage": 28.79, "elapsed_time": "0:21:42", "remaining_time": "0:53:42"}
{"current_steps": 100, "total_steps": 330, "loss": 0.8729, "learning_rate": 8.171966420818227e-07, "epoch": 0.9029345372460497, "percentage": 30.3, "elapsed_time": "0:22:48", "remaining_time": "0:52:27"}
{"current_steps": 100, "total_steps": 330, "eval_loss": 0.8780717253684998, "epoch": 0.9029345372460497, "percentage": 30.3, "elapsed_time": "0:23:43", "remaining_time": "0:54:34"}
{"current_steps": 105, "total_steps": 330, "loss": 0.8738, "learning_rate": 7.978496522462167e-07, "epoch": 0.9480812641083521, "percentage": 31.82, "elapsed_time": "0:24:48", "remaining_time": "0:53:10"}
{"current_steps": 110, "total_steps": 330, "loss": 0.8693, "learning_rate": 7.777851165098011e-07, "epoch": 0.9932279909706546, "percentage": 33.33, "elapsed_time": "0:25:53", "remaining_time": "0:51:47"}
{"current_steps": 115, "total_steps": 330, "loss": 0.8148, "learning_rate": 7.570513720966107e-07, "epoch": 1.0383747178329572, "percentage": 34.85, "elapsed_time": "0:26:59", "remaining_time": "0:50:27"}
{"current_steps": 120, "total_steps": 330, "loss": 0.8324, "learning_rate": 7.356983684129989e-07, "epoch": 1.0835214446952597, "percentage": 36.36, "elapsed_time": "0:28:05", "remaining_time": "0:49:09"}
{"current_steps": 125, "total_steps": 330, "loss": 0.7914, "learning_rate": 7.13777546715141e-07, "epoch": 1.1286681715575622, "percentage": 37.88, "elapsed_time": "0:29:10", "remaining_time": "0:47:51"}
{"current_steps": 130, "total_steps": 330, "loss": 0.7891, "learning_rate": 6.913417161825449e-07, "epoch": 1.1738148984198646, "percentage": 39.39, "elapsed_time": "0:30:15", "remaining_time": "0:46:33"}
{"current_steps": 135, "total_steps": 330, "loss": 0.7905, "learning_rate": 6.684449266961099e-07, "epoch": 1.2189616252821671, "percentage": 40.91, "elapsed_time": "0:31:21", "remaining_time": "0:45:17"}
{"current_steps": 140, "total_steps": 330, "loss": 0.7919, "learning_rate": 6.451423386272311e-07, "epoch": 1.2641083521444696, "percentage": 42.42, "elapsed_time": "0:32:26", "remaining_time": "0:44:02"}
{"current_steps": 145, "total_steps": 330, "loss": 0.8129, "learning_rate": 6.21490089951632e-07, "epoch": 1.309255079006772, "percentage": 43.94, "elapsed_time": "0:33:32", "remaining_time": "0:42:47"}
{"current_steps": 150, "total_steps": 330, "loss": 0.8045, "learning_rate": 5.975451610080642e-07, "epoch": 1.3544018058690745, "percentage": 45.45, "elapsed_time": "0:34:37", "remaining_time": "0:41:32"}
{"current_steps": 150, "total_steps": 330, "eval_loss": 0.859570324420929, "epoch": 1.3544018058690745, "percentage": 45.45, "elapsed_time": "0:35:32", "remaining_time": "0:42:39"}
{"current_steps": 155, "total_steps": 330, "loss": 0.8012, "learning_rate": 5.733652372276809e-07, "epoch": 1.399548532731377, "percentage": 46.97, "elapsed_time": "0:36:38", "remaining_time": "0:41:22"}
{"current_steps": 160, "total_steps": 330, "loss": 0.7977, "learning_rate": 5.490085701647804e-07, "epoch": 1.4446952595936795, "percentage": 48.48, "elapsed_time": "0:37:43", "remaining_time": "0:40:05"}
{"current_steps": 165, "total_steps": 330, "loss": 0.7953, "learning_rate": 5.245338371637091e-07, "epoch": 1.489841986455982, "percentage": 50.0, "elapsed_time": "0:38:49", "remaining_time": "0:38:49"}
{"current_steps": 170, "total_steps": 330, "loss": 0.7917, "learning_rate": 5e-07, "epoch": 1.5349887133182845, "percentage": 51.52, "elapsed_time": "0:39:54", "remaining_time": "0:37:33"}
{"current_steps": 175, "total_steps": 330, "loss": 0.7905, "learning_rate": 4.75466162836291e-07, "epoch": 1.580135440180587, "percentage": 53.03, "elapsed_time": "0:40:58", "remaining_time": "0:36:17"}
{"current_steps": 180, "total_steps": 330, "loss": 0.7948, "learning_rate": 4.5099142983521963e-07, "epoch": 1.6252821670428894, "percentage": 54.55, "elapsed_time": "0:42:04", "remaining_time": "0:35:03"}
{"current_steps": 185, "total_steps": 330, "loss": 0.7983, "learning_rate": 4.2663476277231915e-07, "epoch": 1.670428893905192, "percentage": 56.06, "elapsed_time": "0:43:09", "remaining_time": "0:33:49"}
{"current_steps": 190, "total_steps": 330, "loss": 0.8006, "learning_rate": 4.0245483899193586e-07, "epoch": 1.7155756207674944, "percentage": 57.58, "elapsed_time": "0:44:15", "remaining_time": "0:32:36"}
{"current_steps": 195, "total_steps": 330, "loss": 0.7879, "learning_rate": 3.785099100483681e-07, "epoch": 1.7607223476297968, "percentage": 59.09, "elapsed_time": "0:45:20", "remaining_time": "0:31:23"}
{"current_steps": 200, "total_steps": 330, "loss": 0.7875, "learning_rate": 3.548576613727689e-07, "epoch": 1.8058690744920993, "percentage": 60.61, "elapsed_time": "0:46:26", "remaining_time": "0:30:10"}
{"current_steps": 200, "total_steps": 330, "eval_loss": 0.847703754901886, "epoch": 1.8058690744920993, "percentage": 60.61, "elapsed_time": "0:47:21", "remaining_time": "0:30:46"}
{"current_steps": 205, "total_steps": 330, "loss": 0.7951, "learning_rate": 3.3155507330388996e-07, "epoch": 1.8510158013544018, "percentage": 62.12, "elapsed_time": "0:48:27", "remaining_time": "0:29:32"}
{"current_steps": 210, "total_steps": 330, "loss": 0.7895, "learning_rate": 3.086582838174551e-07, "epoch": 1.8961625282167043, "percentage": 63.64, "elapsed_time": "0:49:32", "remaining_time": "0:28:18"}
{"current_steps": 215, "total_steps": 330, "loss": 0.7825, "learning_rate": 2.8622245328485907e-07, "epoch": 1.9413092550790068, "percentage": 65.15, "elapsed_time": "0:50:37", "remaining_time": "0:27:04"}
{"current_steps": 220, "total_steps": 330, "loss": 0.7836, "learning_rate": 2.6430163158700113e-07, "epoch": 1.9864559819413092, "percentage": 66.67, "elapsed_time": "0:51:43", "remaining_time": "0:25:51"}
{"current_steps": 225, "total_steps": 330, "loss": 0.7546, "learning_rate": 2.4294862790338916e-07, "epoch": 2.0316027088036117, "percentage": 68.18, "elapsed_time": "0:52:48", "remaining_time": "0:24:38"}
{"current_steps": 230, "total_steps": 330, "loss": 0.7482, "learning_rate": 2.2221488349019902e-07, "epoch": 2.0767494356659144, "percentage": 69.7, "elapsed_time": "0:53:54", "remaining_time": "0:23:26"}
{"current_steps": 235, "total_steps": 330, "loss": 0.7402, "learning_rate": 2.021503477537833e-07, "epoch": 2.1218961625282167, "percentage": 71.21, "elapsed_time": "0:55:00", "remaining_time": "0:22:14"}
{"current_steps": 240, "total_steps": 330, "loss": 0.7451, "learning_rate": 1.828033579181773e-07, "epoch": 2.1670428893905194, "percentage": 72.73, "elapsed_time": "0:56:06", "remaining_time": "0:21:02"}
{"current_steps": 245, "total_steps": 330, "loss": 0.7465, "learning_rate": 1.6422052257649077e-07, "epoch": 2.2121896162528216, "percentage": 74.24, "elapsed_time": "0:57:11", "remaining_time": "0:19:50"}
{"current_steps": 250, "total_steps": 330, "loss": 0.7391, "learning_rate": 1.4644660940672627e-07, "epoch": 2.2573363431151243, "percentage": 75.76, "elapsed_time": "0:58:17", "remaining_time": "0:18:39"}
{"current_steps": 250, "total_steps": 330, "eval_loss": 0.8480744957923889, "epoch": 2.2573363431151243, "percentage": 75.76, "elapsed_time": "0:59:12", "remaining_time": "0:18:56"}
{"current_steps": 255, "total_steps": 330, "loss": 0.7314, "learning_rate": 1.2952443732252054e-07, "epoch": 2.3024830699774266, "percentage": 77.27, "elapsed_time": "1:00:17", "remaining_time": "0:17:44"}
{"current_steps": 260, "total_steps": 330, "loss": 0.7484, "learning_rate": 1.134947733186315e-07, "epoch": 2.3476297968397293, "percentage": 78.79, "elapsed_time": "1:01:22", "remaining_time": "0:16:31"}
{"current_steps": 265, "total_steps": 330, "loss": 0.7429, "learning_rate": 9.839623425967758e-08, "epoch": 2.3927765237020315, "percentage": 80.3, "elapsed_time": "1:02:27", "remaining_time": "0:15:19"}
{"current_steps": 270, "total_steps": 330, "loss": 0.7335, "learning_rate": 8.426519384872732e-08, "epoch": 2.4379232505643342, "percentage": 81.82, "elapsed_time": "1:03:32", "remaining_time": "0:14:07"}
{"current_steps": 275, "total_steps": 330, "loss": 0.757, "learning_rate": 7.1135694999864e-08, "epoch": 2.4830699774266365, "percentage": 83.33, "elapsed_time": "1:04:37", "remaining_time": "0:12:55"}
{"current_steps": 280, "total_steps": 330, "loss": 0.7237, "learning_rate": 5.9039367825822526e-08, "epoch": 2.528216704288939, "percentage": 84.85, "elapsed_time": "1:05:42", "remaining_time": "0:11:44"}
{"current_steps": 285, "total_steps": 330, "loss": 0.7379, "learning_rate": 4.800535343827833e-08, "epoch": 2.5733634311512414, "percentage": 86.36, "elapsed_time": "1:06:47", "remaining_time": "0:10:32"}
{"current_steps": 290, "total_steps": 330, "loss": 0.7406, "learning_rate": 3.806023374435663e-08, "epoch": 2.618510158013544, "percentage": 87.88, "elapsed_time": "1:07:54", "remaining_time": "0:09:21"}
{"current_steps": 295, "total_steps": 330, "loss": 0.7231, "learning_rate": 2.922796740848965e-08, "epoch": 2.6636568848758464, "percentage": 89.39, "elapsed_time": "1:08:59", "remaining_time": "0:08:11"}
{"current_steps": 300, "total_steps": 330, "loss": 0.7339, "learning_rate": 2.1529832133895588e-08, "epoch": 2.708803611738149, "percentage": 90.91, "elapsed_time": "1:10:04", "remaining_time": "0:07:00"}
{"current_steps": 300, "total_steps": 330, "eval_loss": 0.8461548089981079, "epoch": 2.708803611738149, "percentage": 90.91, "elapsed_time": "1:10:59", "remaining_time": "0:07:05"}
{"current_steps": 305, "total_steps": 330, "loss": 0.7323, "learning_rate": 1.4984373402728012e-08, "epoch": 2.7539503386004514, "percentage": 92.42, "elapsed_time": "1:12:05", "remaining_time": "0:05:54"}
{"current_steps": 310, "total_steps": 330, "loss": 0.7267, "learning_rate": 9.607359798384784e-09, "epoch": 2.799097065462754, "percentage": 93.94, "elapsed_time": "1:13:11", "remaining_time": "0:04:43"}
{"current_steps": 315, "total_steps": 330, "loss": 0.7242, "learning_rate": 5.411745017609493e-09, "epoch": 2.8442437923250563, "percentage": 95.45, "elapsed_time": "1:14:17", "remaining_time": "0:03:32"}
{"current_steps": 320, "total_steps": 330, "loss": 0.7201, "learning_rate": 2.407636663901591e-09, "epoch": 2.889390519187359, "percentage": 96.97, "elapsed_time": "1:15:23", "remaining_time": "0:02:21"}
{"current_steps": 325, "total_steps": 330, "loss": 0.7308, "learning_rate": 6.022718974137975e-10, "epoch": 2.9345372460496613, "percentage": 98.48, "elapsed_time": "1:16:28", "remaining_time": "0:01:10"}
{"current_steps": 330, "total_steps": 330, "loss": 0.7362, "learning_rate": 0.0, "epoch": 2.979683972911964, "percentage": 100.0, "elapsed_time": "1:17:34", "remaining_time": "0:00:00"}
{"current_steps": 330, "total_steps": 330, "epoch": 2.979683972911964, "percentage": 100.0, "elapsed_time": "1:18:04", "remaining_time": "0:00:00"}