chchen's picture
Training in progress, step 350
e33a3b0 verified
raw
history blame
8.14 kB
{"current_steps": 10, "total_steps": 3270, "loss": 1.3515, "lr": 3.0581039755351682e-06, "epoch": 0.015278838808250574, "percentage": 0.31, "elapsed_time": "0:01:29", "remaining_time": "8:08:42"}
{"current_steps": 20, "total_steps": 3270, "loss": 1.2833, "lr": 6.1162079510703365e-06, "epoch": 0.030557677616501147, "percentage": 0.61, "elapsed_time": "0:03:02", "remaining_time": "8:14:52"}
{"current_steps": 30, "total_steps": 3270, "loss": 1.0237, "lr": 9.174311926605506e-06, "epoch": 0.04583651642475172, "percentage": 0.92, "elapsed_time": "0:04:35", "remaining_time": "8:15:23"}
{"current_steps": 40, "total_steps": 3270, "loss": 0.8029, "lr": 1.2232415902140673e-05, "epoch": 0.061115355233002294, "percentage": 1.22, "elapsed_time": "0:06:07", "remaining_time": "8:14:51"}
{"current_steps": 50, "total_steps": 3270, "loss": 0.5143, "lr": 1.5290519877675842e-05, "epoch": 0.07639419404125286, "percentage": 1.53, "elapsed_time": "0:07:39", "remaining_time": "8:13:22"}
{"current_steps": 50, "total_steps": 3270, "eval_loss": 0.30689939856529236, "epoch": 0.07639419404125286, "percentage": 1.53, "elapsed_time": "0:10:51", "remaining_time": "11:39:34"}
{"current_steps": 60, "total_steps": 3270, "loss": 0.2999, "lr": 1.834862385321101e-05, "epoch": 0.09167303284950344, "percentage": 1.83, "elapsed_time": "0:12:27", "remaining_time": "11:06:14"}
{"current_steps": 70, "total_steps": 3270, "loss": 0.2094, "lr": 2.140672782874618e-05, "epoch": 0.10695187165775401, "percentage": 2.14, "elapsed_time": "0:13:59", "remaining_time": "10:39:22"}
{"current_steps": 80, "total_steps": 3270, "loss": 0.1623, "lr": 2.4464831804281346e-05, "epoch": 0.12223071046600459, "percentage": 2.45, "elapsed_time": "0:15:30", "remaining_time": "10:18:38"}
{"current_steps": 90, "total_steps": 3270, "loss": 0.1138, "lr": 2.7522935779816515e-05, "epoch": 0.13750954927425516, "percentage": 2.75, "elapsed_time": "0:17:02", "remaining_time": "10:02:16"}
{"current_steps": 100, "total_steps": 3270, "loss": 0.1115, "lr": 3.0581039755351684e-05, "epoch": 0.15278838808250572, "percentage": 3.06, "elapsed_time": "0:18:34", "remaining_time": "9:48:48"}
{"current_steps": 100, "total_steps": 3270, "eval_loss": 0.08002135157585144, "epoch": 0.15278838808250572, "percentage": 3.06, "elapsed_time": "0:21:46", "remaining_time": "11:30:00"}
{"current_steps": 110, "total_steps": 3270, "loss": 0.0747, "lr": 3.363914373088685e-05, "epoch": 0.16806722689075632, "percentage": 3.36, "elapsed_time": "0:23:20", "remaining_time": "11:10:39"}
{"current_steps": 120, "total_steps": 3270, "loss": 0.0824, "lr": 3.669724770642202e-05, "epoch": 0.18334606569900688, "percentage": 3.67, "elapsed_time": "0:24:52", "remaining_time": "10:52:58"}
{"current_steps": 130, "total_steps": 3270, "loss": 0.0737, "lr": 3.9755351681957185e-05, "epoch": 0.19862490450725745, "percentage": 3.98, "elapsed_time": "0:26:24", "remaining_time": "10:37:46"}
{"current_steps": 140, "total_steps": 3270, "loss": 0.0822, "lr": 4.281345565749236e-05, "epoch": 0.21390374331550802, "percentage": 4.28, "elapsed_time": "0:27:55", "remaining_time": "10:24:26"}
{"current_steps": 150, "total_steps": 3270, "loss": 0.0781, "lr": 4.587155963302753e-05, "epoch": 0.22918258212375858, "percentage": 4.59, "elapsed_time": "0:29:28", "remaining_time": "10:13:03"}
{"current_steps": 150, "total_steps": 3270, "eval_loss": 0.06360089778900146, "epoch": 0.22918258212375858, "percentage": 4.59, "elapsed_time": "0:32:40", "remaining_time": "11:19:37"}
{"current_steps": 160, "total_steps": 3270, "loss": 0.0754, "lr": 4.892966360856269e-05, "epoch": 0.24446142093200918, "percentage": 4.89, "elapsed_time": "0:34:15", "remaining_time": "11:05:56"}
{"current_steps": 170, "total_steps": 3270, "loss": 0.0666, "lr": 5.1987767584097854e-05, "epoch": 0.2597402597402597, "percentage": 5.2, "elapsed_time": "0:35:48", "remaining_time": "10:52:51"}
{"current_steps": 180, "total_steps": 3270, "loss": 0.0705, "lr": 5.504587155963303e-05, "epoch": 0.2750190985485103, "percentage": 5.5, "elapsed_time": "0:37:20", "remaining_time": "10:40:55"}
{"current_steps": 190, "total_steps": 3270, "loss": 0.0741, "lr": 5.81039755351682e-05, "epoch": 0.2902979373567609, "percentage": 5.81, "elapsed_time": "0:38:51", "remaining_time": "10:30:02"}
{"current_steps": 200, "total_steps": 3270, "loss": 0.0677, "lr": 6.116207951070337e-05, "epoch": 0.30557677616501144, "percentage": 6.12, "elapsed_time": "0:40:23", "remaining_time": "10:20:03"}
{"current_steps": 200, "total_steps": 3270, "eval_loss": 0.059481341391801834, "epoch": 0.30557677616501144, "percentage": 6.12, "elapsed_time": "0:43:34", "remaining_time": "11:08:54"}
{"current_steps": 210, "total_steps": 3270, "loss": 0.0619, "lr": 6.422018348623854e-05, "epoch": 0.32085561497326204, "percentage": 6.42, "elapsed_time": "0:45:09", "remaining_time": "10:57:55"}
{"current_steps": 220, "total_steps": 3270, "loss": 0.0806, "lr": 6.72782874617737e-05, "epoch": 0.33613445378151263, "percentage": 6.73, "elapsed_time": "0:46:40", "remaining_time": "10:47:11"}
{"current_steps": 230, "total_steps": 3270, "loss": 0.0677, "lr": 7.033639143730886e-05, "epoch": 0.35141329258976317, "percentage": 7.03, "elapsed_time": "0:48:12", "remaining_time": "10:37:13"}
{"current_steps": 240, "total_steps": 3270, "loss": 0.0606, "lr": 7.339449541284404e-05, "epoch": 0.36669213139801377, "percentage": 7.34, "elapsed_time": "0:49:44", "remaining_time": "10:27:58"}
{"current_steps": 250, "total_steps": 3270, "loss": 0.0609, "lr": 7.645259938837921e-05, "epoch": 0.3819709702062643, "percentage": 7.65, "elapsed_time": "0:51:16", "remaining_time": "10:19:22"}
{"current_steps": 250, "total_steps": 3270, "eval_loss": 0.04995494335889816, "epoch": 0.3819709702062643, "percentage": 7.65, "elapsed_time": "0:54:27", "remaining_time": "10:57:49"}
{"current_steps": 260, "total_steps": 3270, "loss": 0.0462, "lr": 7.951070336391437e-05, "epoch": 0.3972498090145149, "percentage": 7.95, "elapsed_time": "0:56:01", "remaining_time": "10:48:37"}
{"current_steps": 270, "total_steps": 3270, "loss": 0.0799, "lr": 8.256880733944955e-05, "epoch": 0.4125286478227655, "percentage": 8.26, "elapsed_time": "0:57:33", "remaining_time": "10:39:31"}
{"current_steps": 280, "total_steps": 3270, "loss": 0.0758, "lr": 8.562691131498472e-05, "epoch": 0.42780748663101603, "percentage": 8.56, "elapsed_time": "0:59:04", "remaining_time": "10:30:51"}
{"current_steps": 290, "total_steps": 3270, "loss": 0.0554, "lr": 8.868501529051988e-05, "epoch": 0.4430863254392666, "percentage": 8.87, "elapsed_time": "1:00:35", "remaining_time": "10:22:42"}
{"current_steps": 300, "total_steps": 3270, "loss": 0.0442, "lr": 9.174311926605506e-05, "epoch": 0.45836516424751717, "percentage": 9.17, "elapsed_time": "1:02:07", "remaining_time": "10:14:58"}
{"current_steps": 300, "total_steps": 3270, "eval_loss": 0.051944799721241, "epoch": 0.45836516424751717, "percentage": 9.17, "elapsed_time": "1:05:18", "remaining_time": "10:46:31"}
{"current_steps": 310, "total_steps": 3270, "loss": 0.0433, "lr": 9.480122324159021e-05, "epoch": 0.47364400305576776, "percentage": 9.48, "elapsed_time": "1:06:53", "remaining_time": "10:38:45"}
{"current_steps": 320, "total_steps": 3270, "loss": 0.0546, "lr": 9.785932721712538e-05, "epoch": 0.48892284186401835, "percentage": 9.79, "elapsed_time": "1:08:25", "remaining_time": "10:30:45"}
{"current_steps": 330, "total_steps": 3270, "loss": 0.0597, "lr": 9.999974360983129e-05, "epoch": 0.5042016806722689, "percentage": 10.09, "elapsed_time": "1:09:56", "remaining_time": "10:23:11"}
{"current_steps": 340, "total_steps": 3270, "loss": 0.0626, "lr": 9.999518563553522e-05, "epoch": 0.5194805194805194, "percentage": 10.4, "elapsed_time": "1:11:28", "remaining_time": "10:15:59"}
{"current_steps": 350, "total_steps": 3270, "loss": 0.0605, "lr": 9.998493069976636e-05, "epoch": 0.5347593582887701, "percentage": 10.7, "elapsed_time": "1:13:01", "remaining_time": "10:09:10"}
{"current_steps": 350, "total_steps": 3270, "eval_loss": 0.052965257316827774, "epoch": 0.5347593582887701, "percentage": 10.7, "elapsed_time": "1:16:13", "remaining_time": "10:35:54"}