chchen's picture
Training in progress, step 1050
4b1bcae verified
raw
history blame
24.3 kB
{"current_steps": 10, "total_steps": 3320, "loss": 1.3483, "lr": 3.0120481927710846e-06, "epoch": 0.015053156458744943, "percentage": 0.3, "elapsed_time": "0:01:16", "remaining_time": "7:03:14"}
{"current_steps": 20, "total_steps": 3320, "loss": 1.2949, "lr": 6.024096385542169e-06, "epoch": 0.030106312917489886, "percentage": 0.6, "elapsed_time": "0:02:32", "remaining_time": "6:59:21"}
{"current_steps": 30, "total_steps": 3320, "loss": 1.1399, "lr": 9.036144578313253e-06, "epoch": 0.04515946937623483, "percentage": 0.9, "elapsed_time": "0:03:47", "remaining_time": "6:56:29"}
{"current_steps": 40, "total_steps": 3320, "loss": 0.9064, "lr": 1.2048192771084338e-05, "epoch": 0.06021262583497977, "percentage": 1.2, "elapsed_time": "0:05:04", "remaining_time": "6:55:32"}
{"current_steps": 50, "total_steps": 3320, "loss": 0.4566, "lr": 1.5060240963855424e-05, "epoch": 0.07526578229372471, "percentage": 1.51, "elapsed_time": "0:06:19", "remaining_time": "6:53:37"}
{"current_steps": 50, "total_steps": 3320, "eval_loss": 0.31506142020225525, "epoch": 0.07526578229372471, "percentage": 1.51, "elapsed_time": "0:08:56", "remaining_time": "9:44:29"}
{"current_steps": 60, "total_steps": 3320, "loss": 0.2427, "lr": 1.8072289156626505e-05, "epoch": 0.09031893875246966, "percentage": 1.81, "elapsed_time": "0:10:16", "remaining_time": "9:17:51"}
{"current_steps": 70, "total_steps": 3320, "loss": 0.2342, "lr": 2.1084337349397593e-05, "epoch": 0.1053720952112146, "percentage": 2.11, "elapsed_time": "0:11:31", "remaining_time": "8:55:16"}
{"current_steps": 80, "total_steps": 3320, "loss": 0.1697, "lr": 2.4096385542168677e-05, "epoch": 0.12042525166995954, "percentage": 2.41, "elapsed_time": "0:12:47", "remaining_time": "8:37:51"}
{"current_steps": 90, "total_steps": 3320, "loss": 0.1242, "lr": 2.7108433734939758e-05, "epoch": 0.1354784081287045, "percentage": 2.71, "elapsed_time": "0:14:02", "remaining_time": "8:24:06"}
{"current_steps": 100, "total_steps": 3320, "loss": 0.1039, "lr": 3.012048192771085e-05, "epoch": 0.15053156458744943, "percentage": 3.01, "elapsed_time": "0:15:18", "remaining_time": "8:12:48"}
{"current_steps": 100, "total_steps": 3320, "eval_loss": 0.09335148334503174, "epoch": 0.15053156458744943, "percentage": 3.01, "elapsed_time": "0:17:55", "remaining_time": "9:37:01"}
{"current_steps": 110, "total_steps": 3320, "loss": 0.0837, "lr": 3.313253012048193e-05, "epoch": 0.16558472104619437, "percentage": 3.31, "elapsed_time": "0:19:15", "remaining_time": "9:21:50"}
{"current_steps": 120, "total_steps": 3320, "loss": 0.1008, "lr": 3.614457831325301e-05, "epoch": 0.18063787750493931, "percentage": 3.61, "elapsed_time": "0:20:30", "remaining_time": "9:07:01"}
{"current_steps": 130, "total_steps": 3320, "loss": 0.0816, "lr": 3.91566265060241e-05, "epoch": 0.19569103396368426, "percentage": 3.92, "elapsed_time": "0:21:46", "remaining_time": "8:54:17"}
{"current_steps": 140, "total_steps": 3320, "loss": 0.0828, "lr": 4.2168674698795186e-05, "epoch": 0.2107441904224292, "percentage": 4.22, "elapsed_time": "0:23:01", "remaining_time": "8:43:09"}
{"current_steps": 150, "total_steps": 3320, "loss": 0.0879, "lr": 4.5180722891566266e-05, "epoch": 0.22579734688117414, "percentage": 4.52, "elapsed_time": "0:24:17", "remaining_time": "8:33:21"}
{"current_steps": 150, "total_steps": 3320, "eval_loss": 0.07289445400238037, "epoch": 0.22579734688117414, "percentage": 4.52, "elapsed_time": "0:26:54", "remaining_time": "9:28:38"}
{"current_steps": 160, "total_steps": 3320, "loss": 0.0821, "lr": 4.8192771084337354e-05, "epoch": 0.2408505033399191, "percentage": 4.82, "elapsed_time": "0:28:14", "remaining_time": "9:17:51"}
{"current_steps": 170, "total_steps": 3320, "loss": 0.0799, "lr": 5.120481927710844e-05, "epoch": 0.25590365979866403, "percentage": 5.12, "elapsed_time": "0:29:30", "remaining_time": "9:06:47"}
{"current_steps": 180, "total_steps": 3320, "loss": 0.0729, "lr": 5.4216867469879516e-05, "epoch": 0.270956816257409, "percentage": 5.42, "elapsed_time": "0:30:46", "remaining_time": "8:56:50"}
{"current_steps": 190, "total_steps": 3320, "loss": 0.0699, "lr": 5.72289156626506e-05, "epoch": 0.2860099727161539, "percentage": 5.72, "elapsed_time": "0:32:02", "remaining_time": "8:47:44"}
{"current_steps": 200, "total_steps": 3320, "loss": 0.0684, "lr": 6.02409638554217e-05, "epoch": 0.30106312917489886, "percentage": 6.02, "elapsed_time": "0:33:18", "remaining_time": "8:39:32"}
{"current_steps": 200, "total_steps": 3320, "eval_loss": 0.06437338143587112, "epoch": 0.30106312917489886, "percentage": 6.02, "elapsed_time": "0:35:55", "remaining_time": "9:20:21"}
{"current_steps": 210, "total_steps": 3320, "loss": 0.0706, "lr": 6.325301204819278e-05, "epoch": 0.3161162856336438, "percentage": 6.33, "elapsed_time": "0:37:15", "remaining_time": "9:11:44"}
{"current_steps": 220, "total_steps": 3320, "loss": 0.066, "lr": 6.626506024096386e-05, "epoch": 0.33116944209238874, "percentage": 6.63, "elapsed_time": "0:38:30", "remaining_time": "9:02:41"}
{"current_steps": 230, "total_steps": 3320, "loss": 0.0741, "lr": 6.927710843373494e-05, "epoch": 0.3462225985511337, "percentage": 6.93, "elapsed_time": "0:39:46", "remaining_time": "8:54:23"}
{"current_steps": 240, "total_steps": 3320, "loss": 0.0612, "lr": 7.228915662650602e-05, "epoch": 0.36127575500987863, "percentage": 7.23, "elapsed_time": "0:41:02", "remaining_time": "8:46:37"}
{"current_steps": 250, "total_steps": 3320, "loss": 0.0696, "lr": 7.530120481927712e-05, "epoch": 0.3763289114686236, "percentage": 7.53, "elapsed_time": "0:42:18", "remaining_time": "8:39:26"}
{"current_steps": 250, "total_steps": 3320, "eval_loss": 0.060398537665605545, "epoch": 0.3763289114686236, "percentage": 7.53, "elapsed_time": "0:44:54", "remaining_time": "9:11:28"}
{"current_steps": 260, "total_steps": 3320, "loss": 0.0436, "lr": 7.83132530120482e-05, "epoch": 0.3913820679273685, "percentage": 7.83, "elapsed_time": "0:46:14", "remaining_time": "9:04:16"}
{"current_steps": 270, "total_steps": 3320, "loss": 0.0543, "lr": 8.132530120481928e-05, "epoch": 0.40643522438611346, "percentage": 8.13, "elapsed_time": "0:47:30", "remaining_time": "8:56:34"}
{"current_steps": 280, "total_steps": 3320, "loss": 0.0613, "lr": 8.433734939759037e-05, "epoch": 0.4214883808448584, "percentage": 8.43, "elapsed_time": "0:48:45", "remaining_time": "8:49:26"}
{"current_steps": 290, "total_steps": 3320, "loss": 0.0506, "lr": 8.734939759036145e-05, "epoch": 0.43654153730360334, "percentage": 8.73, "elapsed_time": "0:50:01", "remaining_time": "8:42:41"}
{"current_steps": 300, "total_steps": 3320, "loss": 0.064, "lr": 9.036144578313253e-05, "epoch": 0.4515946937623483, "percentage": 9.04, "elapsed_time": "0:51:17", "remaining_time": "8:36:16"}
{"current_steps": 300, "total_steps": 3320, "eval_loss": 0.053826671093702316, "epoch": 0.4515946937623483, "percentage": 9.04, "elapsed_time": "0:53:53", "remaining_time": "9:02:31"}
{"current_steps": 310, "total_steps": 3320, "loss": 0.0469, "lr": 9.337349397590361e-05, "epoch": 0.46664785022109323, "percentage": 9.34, "elapsed_time": "0:55:13", "remaining_time": "8:56:12"}
{"current_steps": 320, "total_steps": 3320, "loss": 0.0784, "lr": 9.638554216867471e-05, "epoch": 0.4817010066798382, "percentage": 9.64, "elapsed_time": "0:56:28", "remaining_time": "8:49:26"}
{"current_steps": 330, "total_steps": 3320, "loss": 0.056, "lr": 9.939759036144579e-05, "epoch": 0.4967541631385831, "percentage": 9.94, "elapsed_time": "0:57:44", "remaining_time": "8:43:07"}
{"current_steps": 340, "total_steps": 3320, "loss": 0.0396, "lr": 9.999823129264712e-05, "epoch": 0.5118073195973281, "percentage": 10.24, "elapsed_time": "0:58:59", "remaining_time": "8:37:02"}
{"current_steps": 350, "total_steps": 3320, "loss": 0.048, "lr": 9.999104613348688e-05, "epoch": 0.526860476056073, "percentage": 10.54, "elapsed_time": "1:00:15", "remaining_time": "8:31:16"}
{"current_steps": 350, "total_steps": 3320, "eval_loss": 0.055311419069767, "epoch": 0.526860476056073, "percentage": 10.54, "elapsed_time": "1:02:51", "remaining_time": "8:53:23"}
{"current_steps": 360, "total_steps": 3320, "loss": 0.0501, "lr": 9.997833477197385e-05, "epoch": 0.541913632514818, "percentage": 10.84, "elapsed_time": "1:04:11", "remaining_time": "8:47:46"}
{"current_steps": 370, "total_steps": 3320, "loss": 0.0474, "lr": 9.996009861327077e-05, "epoch": 0.5569667889735629, "percentage": 11.14, "elapsed_time": "1:05:26", "remaining_time": "8:41:44"}
{"current_steps": 380, "total_steps": 3320, "loss": 0.0538, "lr": 9.993633967327269e-05, "epoch": 0.5720199454323078, "percentage": 11.45, "elapsed_time": "1:06:42", "remaining_time": "8:36:02"}
{"current_steps": 390, "total_steps": 3320, "loss": 0.0417, "lr": 9.990706057838416e-05, "epoch": 0.5870731018910528, "percentage": 11.75, "elapsed_time": "1:07:57", "remaining_time": "8:30:33"}
{"current_steps": 400, "total_steps": 3320, "loss": 0.0568, "lr": 9.987226456522884e-05, "epoch": 0.6021262583497977, "percentage": 12.05, "elapsed_time": "1:09:12", "remaining_time": "8:25:15"}
{"current_steps": 400, "total_steps": 3320, "eval_loss": 0.05042395368218422, "epoch": 0.6021262583497977, "percentage": 12.05, "elapsed_time": "1:11:49", "remaining_time": "8:44:18"}
{"current_steps": 410, "total_steps": 3320, "loss": 0.0403, "lr": 9.983195548029173e-05, "epoch": 0.6171794148085427, "percentage": 12.35, "elapsed_time": "1:13:12", "remaining_time": "8:39:34"}
{"current_steps": 420, "total_steps": 3320, "loss": 0.0613, "lr": 9.9786137779494e-05, "epoch": 0.6322325712672876, "percentage": 12.65, "elapsed_time": "1:14:27", "remaining_time": "8:34:08"}
{"current_steps": 430, "total_steps": 3320, "loss": 0.0427, "lr": 9.973481652770038e-05, "epoch": 0.6472857277260325, "percentage": 12.95, "elapsed_time": "1:15:43", "remaining_time": "8:28:53"}
{"current_steps": 440, "total_steps": 3320, "loss": 0.0413, "lr": 9.967799739815925e-05, "epoch": 0.6623388841847775, "percentage": 13.25, "elapsed_time": "1:16:58", "remaining_time": "8:23:49"}
{"current_steps": 450, "total_steps": 3320, "loss": 0.0548, "lr": 9.961568667187556e-05, "epoch": 0.6773920406435224, "percentage": 13.55, "elapsed_time": "1:18:13", "remaining_time": "8:18:54"}
{"current_steps": 450, "total_steps": 3320, "eval_loss": 0.046242497861385345, "epoch": 0.6773920406435224, "percentage": 13.55, "elapsed_time": "1:20:50", "remaining_time": "8:35:34"}
{"current_steps": 460, "total_steps": 3320, "loss": 0.0444, "lr": 9.954789123691642e-05, "epoch": 0.6924451971022674, "percentage": 13.86, "elapsed_time": "1:22:10", "remaining_time": "8:30:56"}
{"current_steps": 470, "total_steps": 3320, "loss": 0.0486, "lr": 9.947461858764978e-05, "epoch": 0.7074983535610123, "percentage": 14.16, "elapsed_time": "1:23:26", "remaining_time": "8:25:55"}
{"current_steps": 480, "total_steps": 3320, "loss": 0.0423, "lr": 9.939587682391586e-05, "epoch": 0.7225515100197573, "percentage": 14.46, "elapsed_time": "1:24:41", "remaining_time": "8:21:07"}
{"current_steps": 490, "total_steps": 3320, "loss": 0.0604, "lr": 9.931167465013182e-05, "epoch": 0.7376046664785022, "percentage": 14.76, "elapsed_time": "1:25:57", "remaining_time": "8:16:27"}
{"current_steps": 500, "total_steps": 3320, "loss": 0.0387, "lr": 9.922202137432955e-05, "epoch": 0.7526578229372471, "percentage": 15.06, "elapsed_time": "1:27:13", "remaining_time": "8:11:54"}
{"current_steps": 500, "total_steps": 3320, "eval_loss": 0.04570082202553749, "epoch": 0.7526578229372471, "percentage": 15.06, "elapsed_time": "1:29:50", "remaining_time": "8:26:40"}
{"current_steps": 510, "total_steps": 3320, "loss": 0.0443, "lr": 9.912692690712665e-05, "epoch": 0.7677109793959921, "percentage": 15.36, "elapsed_time": "1:31:12", "remaining_time": "8:22:32"}
{"current_steps": 520, "total_steps": 3320, "loss": 0.0482, "lr": 9.902640176063103e-05, "epoch": 0.782764135854737, "percentage": 15.66, "elapsed_time": "1:32:28", "remaining_time": "8:17:55"}
{"current_steps": 530, "total_steps": 3320, "loss": 0.0529, "lr": 9.892045704727864e-05, "epoch": 0.797817292313482, "percentage": 15.96, "elapsed_time": "1:33:43", "remaining_time": "8:13:24"}
{"current_steps": 540, "total_steps": 3320, "loss": 0.0636, "lr": 9.880910447860527e-05, "epoch": 0.8128704487722269, "percentage": 16.27, "elapsed_time": "1:34:59", "remaining_time": "8:09:01"}
{"current_steps": 550, "total_steps": 3320, "loss": 0.0454, "lr": 9.869235636395177e-05, "epoch": 0.8279236052309719, "percentage": 16.57, "elapsed_time": "1:36:15", "remaining_time": "8:04:45"}
{"current_steps": 550, "total_steps": 3320, "eval_loss": 0.043903350830078125, "epoch": 0.8279236052309719, "percentage": 16.57, "elapsed_time": "1:38:52", "remaining_time": "8:17:57"}
{"current_steps": 560, "total_steps": 3320, "loss": 0.0639, "lr": 9.857022560910338e-05, "epoch": 0.8429767616897168, "percentage": 16.87, "elapsed_time": "1:40:12", "remaining_time": "8:13:51"}
{"current_steps": 570, "total_steps": 3320, "loss": 0.0414, "lr": 9.844272571486311e-05, "epoch": 0.8580299181484617, "percentage": 17.17, "elapsed_time": "1:41:27", "remaining_time": "8:09:31"}
{"current_steps": 580, "total_steps": 3320, "loss": 0.0569, "lr": 9.830987077555924e-05, "epoch": 0.8730830746072067, "percentage": 17.47, "elapsed_time": "1:42:43", "remaining_time": "8:05:17"}
{"current_steps": 590, "total_steps": 3320, "loss": 0.0629, "lr": 9.817167547748729e-05, "epoch": 0.8881362310659516, "percentage": 17.77, "elapsed_time": "1:43:59", "remaining_time": "8:01:10"}
{"current_steps": 600, "total_steps": 3320, "loss": 0.0343, "lr": 9.802815509728662e-05, "epoch": 0.9031893875246966, "percentage": 18.07, "elapsed_time": "1:45:15", "remaining_time": "7:57:09"}
{"current_steps": 600, "total_steps": 3320, "eval_loss": 0.042122405022382736, "epoch": 0.9031893875246966, "percentage": 18.07, "elapsed_time": "1:47:52", "remaining_time": "8:09:03"}
{"current_steps": 610, "total_steps": 3320, "loss": 0.0373, "lr": 9.787932550025158e-05, "epoch": 0.9182425439834415, "percentage": 18.37, "elapsed_time": "1:49:13", "remaining_time": "8:05:13"}
{"current_steps": 620, "total_steps": 3320, "loss": 0.0413, "lr": 9.772520313857775e-05, "epoch": 0.9332957004421865, "percentage": 18.67, "elapsed_time": "1:50:28", "remaining_time": "8:01:07"}
{"current_steps": 630, "total_steps": 3320, "loss": 0.0462, "lr": 9.756580504954334e-05, "epoch": 0.9483488569009314, "percentage": 18.98, "elapsed_time": "1:51:44", "remaining_time": "7:57:07"}
{"current_steps": 640, "total_steps": 3320, "loss": 0.047, "lr": 9.740114885362562e-05, "epoch": 0.9634020133596763, "percentage": 19.28, "elapsed_time": "1:53:00", "remaining_time": "7:53:14"}
{"current_steps": 650, "total_steps": 3320, "loss": 0.0363, "lr": 9.723125275255325e-05, "epoch": 0.9784551698184213, "percentage": 19.58, "elapsed_time": "1:54:16", "remaining_time": "7:49:24"}
{"current_steps": 650, "total_steps": 3320, "eval_loss": 0.0401780903339386, "epoch": 0.9784551698184213, "percentage": 19.58, "elapsed_time": "1:56:54", "remaining_time": "8:00:12"}
{"current_steps": 660, "total_steps": 3320, "loss": 0.0306, "lr": 9.705613552729415e-05, "epoch": 0.9935083262771662, "percentage": 19.88, "elapsed_time": "1:58:14", "remaining_time": "7:56:33"}
{"current_steps": 670, "total_steps": 3320, "loss": 0.0412, "lr": 9.68758165359794e-05, "epoch": 1.0085614827359113, "percentage": 20.18, "elapsed_time": "1:59:30", "remaining_time": "7:52:41"}
{"current_steps": 680, "total_steps": 3320, "loss": 0.0404, "lr": 9.669031571176322e-05, "epoch": 1.0236146391946561, "percentage": 20.48, "elapsed_time": "2:00:46", "remaining_time": "7:48:52"}
{"current_steps": 690, "total_steps": 3320, "loss": 0.0377, "lr": 9.64996535606196e-05, "epoch": 1.0386677956534012, "percentage": 20.78, "elapsed_time": "2:02:02", "remaining_time": "7:45:08"}
{"current_steps": 700, "total_steps": 3320, "loss": 0.0272, "lr": 9.630385115907545e-05, "epoch": 1.053720952112146, "percentage": 21.08, "elapsed_time": "2:03:18", "remaining_time": "7:41:30"}
{"current_steps": 700, "total_steps": 3320, "eval_loss": 0.04149024188518524, "epoch": 1.053720952112146, "percentage": 21.08, "elapsed_time": "2:05:56", "remaining_time": "7:51:21"}
{"current_steps": 710, "total_steps": 3320, "loss": 0.0345, "lr": 9.610293015188067e-05, "epoch": 1.068774108570891, "percentage": 21.39, "elapsed_time": "2:07:16", "remaining_time": "7:47:52"}
{"current_steps": 720, "total_steps": 3320, "loss": 0.0271, "lr": 9.589691274961556e-05, "epoch": 1.083827265029636, "percentage": 21.69, "elapsed_time": "2:08:32", "remaining_time": "7:44:09"}
{"current_steps": 730, "total_steps": 3320, "loss": 0.0437, "lr": 9.568582172623544e-05, "epoch": 1.098880421488381, "percentage": 21.99, "elapsed_time": "2:09:48", "remaining_time": "7:40:31"}
{"current_steps": 740, "total_steps": 3320, "loss": 0.0355, "lr": 9.546968041655326e-05, "epoch": 1.1139335779471258, "percentage": 22.29, "elapsed_time": "2:11:03", "remaining_time": "7:36:57"}
{"current_steps": 750, "total_steps": 3320, "loss": 0.0324, "lr": 9.524851271366001e-05, "epoch": 1.1289867344058706, "percentage": 22.59, "elapsed_time": "2:12:19", "remaining_time": "7:33:27"}
{"current_steps": 750, "total_steps": 3320, "eval_loss": 0.03844917565584183, "epoch": 1.1289867344058706, "percentage": 22.59, "elapsed_time": "2:14:58", "remaining_time": "7:42:29"}
{"current_steps": 760, "total_steps": 3320, "loss": 0.0288, "lr": 9.502234306628355e-05, "epoch": 1.1440398908646157, "percentage": 22.89, "elapsed_time": "2:16:18", "remaining_time": "7:39:09"}
{"current_steps": 770, "total_steps": 3320, "loss": 0.0327, "lr": 9.47911964760858e-05, "epoch": 1.1590930473233607, "percentage": 23.19, "elapsed_time": "2:17:34", "remaining_time": "7:35:37"}
{"current_steps": 780, "total_steps": 3320, "loss": 0.0284, "lr": 9.455509849489915e-05, "epoch": 1.1741462037821055, "percentage": 23.49, "elapsed_time": "2:18:50", "remaining_time": "7:32:08"}
{"current_steps": 790, "total_steps": 3320, "loss": 0.0361, "lr": 9.431407522190175e-05, "epoch": 1.1891993602408506, "percentage": 23.8, "elapsed_time": "2:20:06", "remaining_time": "7:28:43"}
{"current_steps": 800, "total_steps": 3320, "loss": 0.0394, "lr": 9.406815330073244e-05, "epoch": 1.2042525166995954, "percentage": 24.1, "elapsed_time": "2:21:23", "remaining_time": "7:25:21"}
{"current_steps": 800, "total_steps": 3320, "eval_loss": 0.042881306260824203, "epoch": 1.2042525166995954, "percentage": 24.1, "elapsed_time": "2:24:01", "remaining_time": "7:33:40"}
{"current_steps": 810, "total_steps": 3320, "loss": 0.0394, "lr": 9.381735991654546e-05, "epoch": 1.2193056731583405, "percentage": 24.4, "elapsed_time": "2:25:21", "remaining_time": "7:30:27"}
{"current_steps": 820, "total_steps": 3320, "loss": 0.038, "lr": 9.356172279300528e-05, "epoch": 1.2343588296170853, "percentage": 24.7, "elapsed_time": "2:26:38", "remaining_time": "7:27:03"}
{"current_steps": 830, "total_steps": 3320, "loss": 0.0351, "lr": 9.330127018922194e-05, "epoch": 1.2494119860758304, "percentage": 25.0, "elapsed_time": "2:27:54", "remaining_time": "7:23:42"}
{"current_steps": 840, "total_steps": 3320, "loss": 0.0379, "lr": 9.303603089662716e-05, "epoch": 1.2644651425345752, "percentage": 25.3, "elapsed_time": "2:29:10", "remaining_time": "7:20:25"}
{"current_steps": 850, "total_steps": 3320, "loss": 0.0297, "lr": 9.276603423579164e-05, "epoch": 1.2795182989933203, "percentage": 25.6, "elapsed_time": "2:30:26", "remaining_time": "7:17:10"}
{"current_steps": 850, "total_steps": 3320, "eval_loss": 0.04107122868299484, "epoch": 1.2795182989933203, "percentage": 25.6, "elapsed_time": "2:33:05", "remaining_time": "7:24:51"}
{"current_steps": 860, "total_steps": 3320, "loss": 0.0429, "lr": 9.249131005318387e-05, "epoch": 1.294571455452065, "percentage": 25.9, "elapsed_time": "2:34:26", "remaining_time": "7:21:45"}
{"current_steps": 870, "total_steps": 3320, "loss": 0.0349, "lr": 9.221188871787075e-05, "epoch": 1.30962461191081, "percentage": 26.2, "elapsed_time": "2:35:42", "remaining_time": "7:18:29"}
{"current_steps": 880, "total_steps": 3320, "loss": 0.037, "lr": 9.192780111816047e-05, "epoch": 1.324677768369555, "percentage": 26.51, "elapsed_time": "2:36:59", "remaining_time": "7:15:16"}
{"current_steps": 890, "total_steps": 3320, "loss": 0.0327, "lr": 9.163907865818806e-05, "epoch": 1.3397309248283, "percentage": 26.81, "elapsed_time": "2:38:15", "remaining_time": "7:12:05"}
{"current_steps": 900, "total_steps": 3320, "loss": 0.0423, "lr": 9.134575325444376e-05, "epoch": 1.3547840812870449, "percentage": 27.11, "elapsed_time": "2:39:31", "remaining_time": "7:08:56"}
{"current_steps": 900, "total_steps": 3320, "eval_loss": 0.03963349014520645, "epoch": 1.3547840812870449, "percentage": 27.11, "elapsed_time": "2:42:10", "remaining_time": "7:16:03"}
{"current_steps": 910, "total_steps": 3320, "loss": 0.0292, "lr": 9.104785733224496e-05, "epoch": 1.3698372377457897, "percentage": 27.41, "elapsed_time": "2:43:30", "remaining_time": "7:13:02"}
{"current_steps": 920, "total_steps": 3320, "loss": 0.0358, "lr": 9.07454238221517e-05, "epoch": 1.3848903942045347, "percentage": 27.71, "elapsed_time": "2:44:47", "remaining_time": "7:09:52"}
{"current_steps": 930, "total_steps": 3320, "loss": 0.0294, "lr": 9.043848615632642e-05, "epoch": 1.3999435506632798, "percentage": 28.01, "elapsed_time": "2:46:03", "remaining_time": "7:06:44"}
{"current_steps": 940, "total_steps": 3320, "loss": 0.0375, "lr": 9.012707826483823e-05, "epoch": 1.4149967071220246, "percentage": 28.31, "elapsed_time": "2:47:19", "remaining_time": "7:03:40"}
{"current_steps": 950, "total_steps": 3320, "loss": 0.0324, "lr": 8.98112345719122e-05, "epoch": 1.4300498635807695, "percentage": 28.61, "elapsed_time": "2:48:36", "remaining_time": "7:00:38"}
{"current_steps": 950, "total_steps": 3320, "eval_loss": 0.03718731552362442, "epoch": 1.4300498635807695, "percentage": 28.61, "elapsed_time": "2:51:15", "remaining_time": "7:07:14"}
{"current_steps": 960, "total_steps": 3320, "loss": 0.0385, "lr": 8.949098999212391e-05, "epoch": 1.4451030200395145, "percentage": 28.92, "elapsed_time": "2:52:35", "remaining_time": "7:04:18"}
{"current_steps": 970, "total_steps": 3320, "loss": 0.0321, "lr": 8.916637992653991e-05, "epoch": 1.4601561764982596, "percentage": 29.22, "elapsed_time": "2:53:52", "remaining_time": "7:01:13"}
{"current_steps": 980, "total_steps": 3320, "loss": 0.0299, "lr": 8.883744025880428e-05, "epoch": 1.4752093329570044, "percentage": 29.52, "elapsed_time": "2:55:08", "remaining_time": "6:58:11"}
{"current_steps": 990, "total_steps": 3320, "loss": 0.0304, "lr": 8.850420735117202e-05, "epoch": 1.4902624894157492, "percentage": 29.82, "elapsed_time": "2:56:24", "remaining_time": "6:55:11"}
{"current_steps": 1000, "total_steps": 3320, "loss": 0.0311, "lr": 8.816671804048933e-05, "epoch": 1.5053156458744943, "percentage": 30.12, "elapsed_time": "2:57:41", "remaining_time": "6:52:13"}
{"current_steps": 1000, "total_steps": 3320, "eval_loss": 0.03950938582420349, "epoch": 1.5053156458744943, "percentage": 30.12, "elapsed_time": "3:00:19", "remaining_time": "6:58:22"}
{"current_steps": 1010, "total_steps": 3320, "loss": 0.0358, "lr": 8.782500963412156e-05, "epoch": 1.5203688023332393, "percentage": 30.42, "elapsed_time": "3:01:40", "remaining_time": "6:55:30"}
{"current_steps": 1020, "total_steps": 3320, "loss": 0.029, "lr": 8.747911990582912e-05, "epoch": 1.5354219587919842, "percentage": 30.72, "elapsed_time": "3:02:56", "remaining_time": "6:52:32"}
{"current_steps": 1030, "total_steps": 3320, "loss": 0.0288, "lr": 8.712908709159183e-05, "epoch": 1.550475115250729, "percentage": 31.02, "elapsed_time": "3:04:13", "remaining_time": "6:49:35"}
{"current_steps": 1040, "total_steps": 3320, "loss": 0.0422, "lr": 8.677494988538211e-05, "epoch": 1.565528271709474, "percentage": 31.33, "elapsed_time": "3:05:29", "remaining_time": "6:46:40"}
{"current_steps": 1050, "total_steps": 3320, "loss": 0.0309, "lr": 8.641674743488769e-05, "epoch": 1.5805814281682191, "percentage": 31.63, "elapsed_time": "3:06:46", "remaining_time": "6:43:47"}
{"current_steps": 1050, "total_steps": 3320, "eval_loss": 0.04065566882491112, "epoch": 1.5805814281682191, "percentage": 31.63, "elapsed_time": "3:09:25", "remaining_time": "6:49:31"}