Training in progress, step 400
Browse files- model-00001-of-00014.safetensors +1 -1
- model-00002-of-00014.safetensors +1 -1
- model-00003-of-00014.safetensors +1 -1
- model-00004-of-00014.safetensors +1 -1
- model-00005-of-00014.safetensors +1 -1
- model-00006-of-00014.safetensors +1 -1
- model-00007-of-00014.safetensors +1 -1
- model-00008-of-00014.safetensors +1 -1
- model-00009-of-00014.safetensors +1 -1
- model-00010-of-00014.safetensors +1 -1
- model-00011-of-00014.safetensors +1 -1
- model-00012-of-00014.safetensors +1 -1
- model-00013-of-00014.safetensors +1 -1
- model-00014-of-00014.safetensors +1 -1
- trainer_log.jsonl +100 -0
model-00001-of-00014.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4891730992
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:90fd55e3b7341e0c7caaa5f8a404dbc154fbfc2e3d3e9a34159ee70f27e8ff8f
|
3 |
size 4891730992
|
model-00002-of-00014.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4876059352
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2fdba3eab8ad630dbc9f0977e0151c13ffb211c7c8b934c2e666fd73532836dd
|
3 |
size 4876059352
|
model-00003-of-00014.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4876059384
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8ff940fdcf39da7a33e8a8e70e01c33a3b5942e934d6be7a283b407dbb189ab0
|
3 |
size 4876059384
|
model-00004-of-00014.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4876059416
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fe09e069c26199583846a6cb76731f304bdd9d19b01e1de6d8f265fa8c02c8d7
|
3 |
size 4876059416
|
model-00005-of-00014.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4876059416
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:adb02c233e80fb2679692ed8b59c9aa0af939a60f755a3570cbd0b3beeaea8d0
|
3 |
size 4876059416
|
model-00006-of-00014.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4876059416
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7a05d04215f2a17c0d485de8616436597a3004956645c0dfb9978b6a56d80775
|
3 |
size 4876059416
|
model-00007-of-00014.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4876059416
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:406b75ec6a0bd6773ae51827508a8115d1da447469518b7cbb3f94ff05f95ba8
|
3 |
size 4876059416
|
model-00008-of-00014.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4876059416
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:781a84b7d941078506b614f1ff615a4adbd565e177db1c6f9ca0af1f4f733a46
|
3 |
size 4876059416
|
model-00009-of-00014.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4876059416
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:62f79a6ae1854b8710deb203b2cad9303d4138e63cfdf56fe22943c5c4a20bfa
|
3 |
size 4876059416
|
model-00010-of-00014.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4876059416
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1126670cde0455f25ae2a59c7c9b1eefb3e33be41a6d4fb969da6d4c058ed034
|
3 |
size 4876059416
|
model-00011-of-00014.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4876059416
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2cdc8b8281cffb33a38ac544a03f6268bc3a76e852f7e33fde2694e4937e41fc
|
3 |
size 4876059416
|
model-00012-of-00014.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4876059416
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b3b407465950e7d870072da1ebb5c5749b205471db520488ac19082ca000303b
|
3 |
size 4876059416
|
model-00013-of-00014.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4876059416
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b0e839c9936ba781b64285ac3e05ca088cf94204b7c08081c53f1fc8814df955
|
3 |
size 4876059416
|
model-00014-of-00014.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 2123397800
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bb6163bf3b89ee02b357ee2f079fe09f878792e2d02e53406b5ef736cd452fdb
|
3 |
size 2123397800
|
trainer_log.jsonl
CHANGED
@@ -300,3 +300,103 @@
|
|
300 |
{"current_steps": 300, "total_steps": 411, "loss": 0.3634, "lr": 2.071415028359026e-06, "epoch": 2.1750759878419452, "percentage": 72.99, "elapsed_time": "1 day, 4:29:13", "remaining_time": "10:32:24"}
|
301 |
{"current_steps": 301, "total_steps": 411, "loss": 0.3362, "lr": 2.037018738245707e-06, "epoch": 2.182370820668693, "percentage": 73.24, "elapsed_time": "1 day, 4:48:41", "remaining_time": "10:31:45"}
|
302 |
{"current_steps": 302, "total_steps": 411, "loss": 0.3511, "lr": 2.0028372179729405e-06, "epoch": 2.1896656534954406, "percentage": 73.48, "elapsed_time": "1 day, 4:53:23", "remaining_time": "10:25:37"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
300 |
{"current_steps": 300, "total_steps": 411, "loss": 0.3634, "lr": 2.071415028359026e-06, "epoch": 2.1750759878419452, "percentage": 72.99, "elapsed_time": "1 day, 4:29:13", "remaining_time": "10:32:24"}
|
301 |
{"current_steps": 301, "total_steps": 411, "loss": 0.3362, "lr": 2.037018738245707e-06, "epoch": 2.182370820668693, "percentage": 73.24, "elapsed_time": "1 day, 4:48:41", "remaining_time": "10:31:45"}
|
302 |
{"current_steps": 302, "total_steps": 411, "loss": 0.3511, "lr": 2.0028372179729405e-06, "epoch": 2.1896656534954406, "percentage": 73.48, "elapsed_time": "1 day, 4:53:23", "remaining_time": "10:25:37"}
|
303 |
+
{"current_steps": 303, "total_steps": 411, "loss": 0.3336, "lr": 1.9688729451668116e-06, "epoch": 2.1969604863221885, "percentage": 73.72, "elapsed_time": "1 day, 4:59:08", "remaining_time": "10:19:53"}
|
304 |
+
{"current_steps": 304, "total_steps": 411, "loss": 0.3349, "lr": 1.935128381706355e-06, "epoch": 2.204255319148936, "percentage": 73.97, "elapsed_time": "1 day, 5:06:02", "remaining_time": "10:14:33"}
|
305 |
+
{"current_steps": 305, "total_steps": 411, "loss": 0.3537, "lr": 1.901605973545116e-06, "epoch": 2.211550151975684, "percentage": 74.21, "elapsed_time": "1 day, 5:12:02", "remaining_time": "10:08:54"}
|
306 |
+
{"current_steps": 306, "total_steps": 411, "loss": 0.3373, "lr": 1.8683081505338468e-06, "epoch": 2.2188449848024314, "percentage": 74.45, "elapsed_time": "1 day, 5:17:16", "remaining_time": "10:02:59"}
|
307 |
+
{"current_steps": 307, "total_steps": 411, "loss": 0.3436, "lr": 1.8352373262443918e-06, "epoch": 2.2261398176291793, "percentage": 74.7, "elapsed_time": "1 day, 5:22:36", "remaining_time": "9:57:06"}
|
308 |
+
{"current_steps": 308, "total_steps": 411, "loss": 0.3245, "lr": 1.8023958977947303e-06, "epoch": 2.2334346504559273, "percentage": 74.94, "elapsed_time": "1 day, 5:28:45", "remaining_time": "9:51:29"}
|
309 |
+
{"current_steps": 309, "total_steps": 411, "loss": 0.3317, "lr": 1.7697862456752273e-06, "epoch": 2.2407294832826747, "percentage": 75.18, "elapsed_time": "1 day, 5:34:46", "remaining_time": "9:45:51"}
|
310 |
+
{"current_steps": 310, "total_steps": 411, "loss": 0.2976, "lr": 1.7374107335760937e-06, "epoch": 2.2480243161094227, "percentage": 75.43, "elapsed_time": "1 day, 5:39:49", "remaining_time": "9:39:52"}
|
311 |
+
{"current_steps": 311, "total_steps": 411, "loss": 0.3178, "lr": 1.7052717082160348e-06, "epoch": 2.25531914893617, "percentage": 75.67, "elapsed_time": "1 day, 5:45:48", "remaining_time": "9:34:13"}
|
312 |
+
{"current_steps": 312, "total_steps": 411, "loss": 0.3187, "lr": 1.6733714991721738e-06, "epoch": 2.262613981762918, "percentage": 75.91, "elapsed_time": "1 day, 5:51:35", "remaining_time": "9:28:29"}
|
313 |
+
{"current_steps": 313, "total_steps": 411, "loss": 0.3194, "lr": 1.6417124187111778e-06, "epoch": 2.2699088145896655, "percentage": 76.16, "elapsed_time": "1 day, 5:56:32", "remaining_time": "9:22:29"}
|
314 |
+
{"current_steps": 314, "total_steps": 411, "loss": 0.3504, "lr": 1.610296761621662e-06, "epoch": 2.2772036474164135, "percentage": 76.4, "elapsed_time": "1 day, 6:02:18", "remaining_time": "9:16:45"}
|
315 |
+
{"current_steps": 315, "total_steps": 411, "loss": 0.3599, "lr": 1.5791268050478487e-06, "epoch": 2.284498480243161, "percentage": 76.64, "elapsed_time": "1 day, 6:08:10", "remaining_time": "9:11:03"}
|
316 |
+
{"current_steps": 316, "total_steps": 411, "loss": 0.3051, "lr": 1.5482048083245116e-06, "epoch": 2.291793313069909, "percentage": 76.89, "elapsed_time": "1 day, 6:13:25", "remaining_time": "9:05:10"}
|
317 |
+
{"current_steps": 317, "total_steps": 411, "loss": 0.3383, "lr": 1.517533012813217e-06, "epoch": 2.2990881458966568, "percentage": 77.13, "elapsed_time": "1 day, 6:20:44", "remaining_time": "8:59:54"}
|
318 |
+
{"current_steps": 318, "total_steps": 411, "loss": 0.3302, "lr": 1.4871136417398407e-06, "epoch": 2.3063829787234043, "percentage": 77.37, "elapsed_time": "1 day, 6:26:42", "remaining_time": "8:54:13"}
|
319 |
+
{"current_steps": 319, "total_steps": 411, "loss": 0.3615, "lr": 1.4569489000334435e-06, "epoch": 2.3136778115501517, "percentage": 77.62, "elapsed_time": "1 day, 6:31:58", "remaining_time": "8:48:20"}
|
320 |
+
{"current_steps": 320, "total_steps": 411, "loss": 0.3139, "lr": 1.427040974166427e-06, "epoch": 2.3209726443768997, "percentage": 77.86, "elapsed_time": "1 day, 6:37:23", "remaining_time": "8:42:30"}
|
321 |
+
{"current_steps": 321, "total_steps": 411, "loss": 0.3327, "lr": 1.3973920319960654e-06, "epoch": 2.3282674772036476, "percentage": 78.1, "elapsed_time": "1 day, 6:42:51", "remaining_time": "8:36:41"}
|
322 |
+
{"current_steps": 322, "total_steps": 411, "loss": 0.3183, "lr": 1.3680042226073554e-06, "epoch": 2.335562310030395, "percentage": 78.35, "elapsed_time": "1 day, 6:48:42", "remaining_time": "8:30:58"}
|
323 |
+
{"current_steps": 323, "total_steps": 411, "loss": 0.3411, "lr": 1.3388796761572493e-06, "epoch": 2.342857142857143, "percentage": 78.59, "elapsed_time": "1 day, 6:53:52", "remaining_time": "8:25:04"}
|
324 |
+
{"current_steps": 324, "total_steps": 411, "loss": 0.3722, "lr": 1.310020503720254e-06, "epoch": 2.3501519756838904, "percentage": 78.83, "elapsed_time": "1 day, 6:58:47", "remaining_time": "8:19:07"}
|
325 |
+
{"current_steps": 325, "total_steps": 411, "loss": 0.325, "lr": 1.2814287971354023e-06, "epoch": 2.3574468085106384, "percentage": 79.08, "elapsed_time": "1 day, 7:03:56", "remaining_time": "8:13:13"}
|
326 |
+
{"current_steps": 326, "total_steps": 411, "loss": 0.3247, "lr": 1.253106628854635e-06, "epoch": 2.364741641337386, "percentage": 79.32, "elapsed_time": "1 day, 7:09:18", "remaining_time": "8:07:23"}
|
327 |
+
{"current_steps": 327, "total_steps": 411, "loss": 0.3079, "lr": 1.2250560517925747e-06, "epoch": 2.3720364741641338, "percentage": 79.56, "elapsed_time": "1 day, 7:14:01", "remaining_time": "8:01:23"}
|
328 |
+
{"current_steps": 328, "total_steps": 411, "loss": 0.3446, "lr": 1.197279099177731e-06, "epoch": 2.3793313069908812, "percentage": 79.81, "elapsed_time": "1 day, 7:19:12", "remaining_time": "7:55:31"}
|
329 |
+
{"current_steps": 329, "total_steps": 411, "loss": 0.3501, "lr": 1.1697777844051105e-06, "epoch": 2.386626139817629, "percentage": 80.05, "elapsed_time": "1 day, 7:25:05", "remaining_time": "7:49:50"}
|
330 |
+
{"current_steps": 330, "total_steps": 411, "loss": 0.3213, "lr": 1.1425541008902852e-06, "epoch": 2.393920972644377, "percentage": 80.29, "elapsed_time": "1 day, 7:31:28", "remaining_time": "7:44:16"}
|
331 |
+
{"current_steps": 331, "total_steps": 411, "loss": 0.3232, "lr": 1.1156100219249022e-06, "epoch": 2.4012158054711246, "percentage": 80.54, "elapsed_time": "1 day, 7:36:32", "remaining_time": "7:38:22"}
|
332 |
+
{"current_steps": 332, "total_steps": 411, "loss": 0.3632, "lr": 1.0889475005336447e-06, "epoch": 2.4085106382978725, "percentage": 80.78, "elapsed_time": "1 day, 7:41:55", "remaining_time": "7:32:33"}
|
333 |
+
{"current_steps": 333, "total_steps": 411, "loss": 0.3355, "lr": 1.0625684693326727e-06, "epoch": 2.41580547112462, "percentage": 81.02, "elapsed_time": "1 day, 7:47:05", "remaining_time": "7:26:42"}
|
334 |
+
{"current_steps": 334, "total_steps": 411, "loss": 0.341, "lr": 1.0364748403895368e-06, "epoch": 2.423100303951368, "percentage": 81.27, "elapsed_time": "1 day, 7:52:41", "remaining_time": "7:20:57"}
|
335 |
+
{"current_steps": 335, "total_steps": 411, "loss": 0.3383, "lr": 1.0106685050845838e-06, "epoch": 2.4303951367781154, "percentage": 81.51, "elapsed_time": "1 day, 7:57:28", "remaining_time": "7:15:00"}
|
336 |
+
{"current_steps": 336, "total_steps": 411, "loss": 0.3246, "lr": 9.851513339738627e-07, "epoch": 2.4376899696048633, "percentage": 81.75, "elapsed_time": "1 day, 8:03:22", "remaining_time": "7:09:19"}
|
337 |
+
{"current_steps": 337, "total_steps": 411, "loss": 0.3418, "lr": 9.599251766535344e-07, "epoch": 2.4449848024316108, "percentage": 82.0, "elapsed_time": "1 day, 8:08:50", "remaining_time": "7:03:32"}
|
338 |
+
{"current_steps": 338, "total_steps": 411, "loss": 0.3536, "lr": 9.349918616258113e-07, "epoch": 2.4522796352583587, "percentage": 82.24, "elapsed_time": "1 day, 8:14:02", "remaining_time": "6:57:42"}
|
339 |
+
{"current_steps": 339, "total_steps": 411, "loss": 0.3278, "lr": 9.10353196166412e-07, "epoch": 2.4595744680851066, "percentage": 82.48, "elapsed_time": "1 day, 8:20:30", "remaining_time": "6:52:08"}
|
340 |
+
{"current_steps": 340, "total_steps": 411, "loss": 0.3417, "lr": 8.860109661935673e-07, "epoch": 2.466869300911854, "percentage": 82.73, "elapsed_time": "1 day, 8:26:01", "remaining_time": "6:46:22"}
|
341 |
+
{"current_steps": 341, "total_steps": 411, "loss": 0.3148, "lr": 8.619669361385663e-07, "epoch": 2.474164133738602, "percentage": 82.97, "elapsed_time": "1 day, 8:31:13", "remaining_time": "6:40:32"}
|
342 |
+
{"current_steps": 342, "total_steps": 411, "loss": 0.3392, "lr": 8.382228488178639e-07, "epoch": 2.4814589665653495, "percentage": 83.21, "elapsed_time": "1 day, 8:36:07", "remaining_time": "6:34:39"}
|
343 |
+
{"current_steps": 343, "total_steps": 411, "loss": 0.3273, "lr": 8.147804253067581e-07, "epoch": 2.4887537993920974, "percentage": 83.45, "elapsed_time": "1 day, 8:42:08", "remaining_time": "6:28:59"}
|
344 |
+
{"current_steps": 344, "total_steps": 411, "loss": 0.3112, "lr": 7.916413648146282e-07, "epoch": 2.496048632218845, "percentage": 83.7, "elapsed_time": "1 day, 8:47:11", "remaining_time": "6:23:08"}
|
345 |
+
{"current_steps": 345, "total_steps": 411, "loss": 0.3463, "lr": 7.6880734456178e-07, "epoch": 2.503343465045593, "percentage": 83.94, "elapsed_time": "1 day, 8:53:34", "remaining_time": "6:17:33"}
|
346 |
+
{"current_steps": 346, "total_steps": 411, "loss": 0.3439, "lr": 7.462800196578662e-07, "epoch": 2.5106382978723403, "percentage": 84.18, "elapsed_time": "1 day, 8:59:17", "remaining_time": "6:11:49"}
|
347 |
+
{"current_steps": 347, "total_steps": 411, "loss": 0.3303, "lr": 7.240610229819195e-07, "epoch": 2.517933130699088, "percentage": 84.43, "elapsed_time": "1 day, 9:04:56", "remaining_time": "6:06:05"}
|
348 |
+
{"current_steps": 348, "total_steps": 411, "loss": 0.3171, "lr": 7.021519650639952e-07, "epoch": 2.525227963525836, "percentage": 84.67, "elapsed_time": "1 day, 9:10:51", "remaining_time": "6:00:24"}
|
349 |
+
{"current_steps": 349, "total_steps": 411, "loss": 0.3239, "lr": 6.805544339684295e-07, "epoch": 2.5325227963525836, "percentage": 84.91, "elapsed_time": "1 day, 9:15:46", "remaining_time": "5:54:33"}
|
350 |
+
{"current_steps": 350, "total_steps": 411, "loss": 0.3378, "lr": 6.592699951787362e-07, "epoch": 2.539817629179331, "percentage": 85.16, "elapsed_time": "1 day, 9:21:27", "remaining_time": "5:48:49"}
|
351 |
+
{"current_steps": 351, "total_steps": 411, "loss": 0.2992, "lr": 6.383001914841252e-07, "epoch": 2.547112462006079, "percentage": 85.4, "elapsed_time": "1 day, 9:26:36", "remaining_time": "5:43:00"}
|
352 |
+
{"current_steps": 352, "total_steps": 411, "loss": 0.3503, "lr": 6.17646542867682e-07, "epoch": 2.554407294832827, "percentage": 85.64, "elapsed_time": "1 day, 9:32:02", "remaining_time": "5:37:14"}
|
353 |
+
{"current_steps": 353, "total_steps": 411, "loss": 0.3385, "lr": 5.973105463961864e-07, "epoch": 2.5617021276595744, "percentage": 85.89, "elapsed_time": "1 day, 9:36:47", "remaining_time": "5:31:22"}
|
354 |
+
{"current_steps": 354, "total_steps": 411, "loss": 0.3396, "lr": 5.772936761116027e-07, "epoch": 2.5689969604863223, "percentage": 86.13, "elapsed_time": "1 day, 9:42:06", "remaining_time": "5:25:35"}
|
355 |
+
{"current_steps": 355, "total_steps": 411, "loss": 0.3373, "lr": 5.575973829242365e-07, "epoch": 2.57629179331307, "percentage": 86.37, "elapsed_time": "1 day, 9:47:24", "remaining_time": "5:19:48"}
|
356 |
+
{"current_steps": 356, "total_steps": 411, "loss": 0.3386, "lr": 5.382230945075556e-07, "epoch": 2.5835866261398177, "percentage": 86.62, "elapsed_time": "1 day, 9:53:12", "remaining_time": "5:14:07"}
|
357 |
+
{"current_steps": 357, "total_steps": 411, "loss": 0.3319, "lr": 5.191722151947227e-07, "epoch": 2.590881458966565, "percentage": 86.86, "elapsed_time": "1 day, 9:58:30", "remaining_time": "5:08:20"}
|
358 |
+
{"current_steps": 358, "total_steps": 411, "loss": 0.3174, "lr": 5.004461258767873e-07, "epoch": 2.598176291793313, "percentage": 87.1, "elapsed_time": "1 day, 10:03:54", "remaining_time": "5:02:35"}
|
359 |
+
{"current_steps": 359, "total_steps": 411, "loss": 0.34, "lr": 4.820461839026047e-07, "epoch": 2.6054711246200606, "percentage": 87.35, "elapsed_time": "1 day, 10:10:05", "remaining_time": "4:56:56"}
|
360 |
+
{"current_steps": 360, "total_steps": 411, "loss": 0.3351, "lr": 4.639737229804403e-07, "epoch": 2.6127659574468085, "percentage": 87.59, "elapsed_time": "1 day, 10:15:30", "remaining_time": "4:51:11"}
|
361 |
+
{"current_steps": 361, "total_steps": 411, "loss": 0.3244, "lr": 4.4623005308130243e-07, "epoch": 2.6200607902735564, "percentage": 87.83, "elapsed_time": "1 day, 10:21:15", "remaining_time": "4:45:29"}
|
362 |
+
{"current_steps": 362, "total_steps": 411, "loss": 0.3065, "lr": 4.2881646034398926e-07, "epoch": 2.627355623100304, "percentage": 88.08, "elapsed_time": "1 day, 10:27:14", "remaining_time": "4:39:49"}
|
363 |
+
{"current_steps": 363, "total_steps": 411, "loss": 0.3306, "lr": 4.1173420698186027e-07, "epoch": 2.634650455927052, "percentage": 88.32, "elapsed_time": "1 day, 10:32:28", "remaining_time": "4:34:02"}
|
364 |
+
{"current_steps": 364, "total_steps": 411, "loss": 0.3514, "lr": 3.9498453119134917e-07, "epoch": 2.6419452887537993, "percentage": 88.56, "elapsed_time": "1 day, 10:37:59", "remaining_time": "4:28:18"}
|
365 |
+
{"current_steps": 365, "total_steps": 411, "loss": 0.3498, "lr": 3.7856864706221187e-07, "epoch": 2.6492401215805472, "percentage": 88.81, "elapsed_time": "1 day, 10:42:41", "remaining_time": "4:22:28"}
|
366 |
+
{"current_steps": 366, "total_steps": 411, "loss": 0.3358, "lr": 3.6248774448952695e-07, "epoch": 2.6565349544072947, "percentage": 89.05, "elapsed_time": "1 day, 10:48:43", "remaining_time": "4:16:48"}
|
367 |
+
{"current_steps": 367, "total_steps": 411, "loss": 0.3129, "lr": 3.467429890874424e-07, "epoch": 2.6638297872340426, "percentage": 89.29, "elapsed_time": "1 day, 10:53:36", "remaining_time": "4:11:00"}
|
368 |
+
{"current_steps": 368, "total_steps": 411, "loss": 0.3213, "lr": 3.313355221046888e-07, "epoch": 2.67112462006079, "percentage": 89.54, "elapsed_time": "1 day, 10:58:47", "remaining_time": "4:05:14"}
|
369 |
+
{"current_steps": 369, "total_steps": 411, "loss": 0.345, "lr": 3.1626646034186084e-07, "epoch": 2.678419452887538, "percentage": 89.78, "elapsed_time": "1 day, 11:04:25", "remaining_time": "3:59:31"}
|
370 |
+
{"current_steps": 370, "total_steps": 411, "loss": 0.3265, "lr": 3.015368960704584e-07, "epoch": 2.685714285714286, "percentage": 90.02, "elapsed_time": "1 day, 11:09:48", "remaining_time": "3:53:47"}
|
371 |
+
{"current_steps": 371, "total_steps": 411, "loss": 0.3434, "lr": 2.871478969537206e-07, "epoch": 2.6930091185410334, "percentage": 90.27, "elapsed_time": "1 day, 11:15:01", "remaining_time": "3:48:02"}
|
372 |
+
{"current_steps": 372, "total_steps": 411, "loss": 0.33, "lr": 2.7310050596923323e-07, "epoch": 2.700303951367781, "percentage": 90.51, "elapsed_time": "1 day, 11:20:56", "remaining_time": "3:42:21"}
|
373 |
+
{"current_steps": 373, "total_steps": 411, "loss": 0.3315, "lr": 2.593957413333331e-07, "epoch": 2.707598784194529, "percentage": 90.75, "elapsed_time": "1 day, 11:26:16", "remaining_time": "3:36:37"}
|
374 |
+
{"current_steps": 374, "total_steps": 411, "loss": 0.3574, "lr": 2.4603459642729867e-07, "epoch": 2.7148936170212767, "percentage": 91.0, "elapsed_time": "1 day, 11:31:44", "remaining_time": "3:30:53"}
|
375 |
+
{"current_steps": 375, "total_steps": 411, "loss": 0.3428, "lr": 2.330180397253473e-07, "epoch": 2.722188449848024, "percentage": 91.24, "elapsed_time": "1 day, 11:36:44", "remaining_time": "3:25:07"}
|
376 |
+
{"current_steps": 376, "total_steps": 411, "loss": 0.2903, "lr": 2.2034701472443854e-07, "epoch": 2.729483282674772, "percentage": 91.48, "elapsed_time": "1 day, 11:42:27", "remaining_time": "3:19:25"}
|
377 |
+
{"current_steps": 377, "total_steps": 411, "loss": 0.3664, "lr": 2.0802243987588068e-07, "epoch": 2.7367781155015196, "percentage": 91.73, "elapsed_time": "1 day, 11:48:02", "remaining_time": "3:13:43"}
|
378 |
+
{"current_steps": 378, "total_steps": 411, "loss": 0.3294, "lr": 1.9604520851876196e-07, "epoch": 2.7440729483282675, "percentage": 91.97, "elapsed_time": "1 day, 11:52:54", "remaining_time": "3:07:57"}
|
379 |
+
{"current_steps": 379, "total_steps": 411, "loss": 0.321, "lr": 1.8441618881519186e-07, "epoch": 2.7513677811550155, "percentage": 92.21, "elapsed_time": "1 day, 11:58:31", "remaining_time": "3:02:14"}
|
380 |
+
{"current_steps": 380, "total_steps": 411, "loss": 0.307, "lr": 1.7313622368738014e-07, "epoch": 2.758662613981763, "percentage": 92.46, "elapsed_time": "1 day, 12:03:54", "remaining_time": "2:56:31"}
|
381 |
+
{"current_steps": 381, "total_steps": 411, "loss": 0.3464, "lr": 1.6220613075653201e-07, "epoch": 2.7659574468085104, "percentage": 92.7, "elapsed_time": "1 day, 12:09:27", "remaining_time": "2:50:49"}
|
382 |
+
{"current_steps": 382, "total_steps": 411, "loss": 0.2907, "lr": 1.51626702283586e-07, "epoch": 2.7732522796352583, "percentage": 92.94, "elapsed_time": "1 day, 12:15:01", "remaining_time": "2:45:07"}
|
383 |
+
{"current_steps": 383, "total_steps": 411, "loss": 0.3481, "lr": 1.4139870511178767e-07, "epoch": 2.7805471124620063, "percentage": 93.19, "elapsed_time": "1 day, 12:20:28", "remaining_time": "2:39:24"}
|
384 |
+
{"current_steps": 384, "total_steps": 411, "loss": 0.2987, "lr": 1.3152288061110518e-07, "epoch": 2.7878419452887537, "percentage": 93.43, "elapsed_time": "1 day, 12:26:01", "remaining_time": "2:33:42"}
|
385 |
+
{"current_steps": 385, "total_steps": 411, "loss": 0.3612, "lr": 1.2199994462448906e-07, "epoch": 2.7951367781155017, "percentage": 93.67, "elapsed_time": "1 day, 12:31:11", "remaining_time": "2:27:58"}
|
386 |
+
{"current_steps": 386, "total_steps": 411, "loss": 0.3051, "lr": 1.1283058741598962e-07, "epoch": 2.802431610942249, "percentage": 93.92, "elapsed_time": "1 day, 12:36:58", "remaining_time": "2:22:17"}
|
387 |
+
{"current_steps": 387, "total_steps": 411, "loss": 0.3362, "lr": 1.0401547362071939e-07, "epoch": 2.809726443768997, "percentage": 94.16, "elapsed_time": "1 day, 12:42:42", "remaining_time": "2:16:36"}
|
388 |
+
{"current_steps": 388, "total_steps": 411, "loss": 0.3206, "lr": 9.555524219667989e-08, "epoch": 2.8170212765957445, "percentage": 94.4, "elapsed_time": "1 day, 12:48:25", "remaining_time": "2:10:54"}
|
389 |
+
{"current_steps": 389, "total_steps": 411, "loss": 0.3332, "lr": 8.745050637844532e-08, "epoch": 2.8243161094224924, "percentage": 94.65, "elapsed_time": "1 day, 12:54:08", "remaining_time": "2:05:13"}
|
390 |
+
{"current_steps": 390, "total_steps": 411, "loss": 0.2941, "lr": 7.970185363271432e-08, "epoch": 2.83161094224924, "percentage": 94.89, "elapsed_time": "1 day, 13:00:23", "remaining_time": "1:59:33"}
|
391 |
+
{"current_steps": 391, "total_steps": 411, "loss": 0.3409, "lr": 7.230984561572729e-08, "epoch": 2.838905775075988, "percentage": 95.13, "elapsed_time": "1 day, 13:06:03", "remaining_time": "1:53:51"}
|
392 |
+
{"current_steps": 392, "total_steps": 411, "loss": 0.3282, "lr": 6.527501813255344e-08, "epoch": 2.8462006079027358, "percentage": 95.38, "elapsed_time": "1 day, 13:12:52", "remaining_time": "1:48:13"}
|
393 |
+
{"current_steps": 393, "total_steps": 411, "loss": 0.3706, "lr": 5.8597881098257924e-08, "epoch": 2.8534954407294832, "percentage": 95.62, "elapsed_time": "1 day, 13:18:51", "remaining_time": "1:42:32"}
|
394 |
+
{"current_steps": 394, "total_steps": 411, "loss": 0.3159, "lr": 5.227891850093314e-08, "epoch": 2.860790273556231, "percentage": 95.86, "elapsed_time": "1 day, 13:24:37", "remaining_time": "1:36:50"}
|
395 |
+
{"current_steps": 395, "total_steps": 411, "loss": 0.3212, "lr": 4.631858836662562e-08, "epoch": 2.8680851063829786, "percentage": 96.11, "elapsed_time": "1 day, 13:30:17", "remaining_time": "1:31:09"}
|
396 |
+
{"current_steps": 396, "total_steps": 411, "loss": 0.3781, "lr": 4.071732272613149e-08, "epoch": 2.8753799392097266, "percentage": 96.35, "elapsed_time": "1 day, 13:36:45", "remaining_time": "1:25:29"}
|
397 |
+
{"current_steps": 397, "total_steps": 411, "loss": 0.3487, "lr": 3.5475527583681005e-08, "epoch": 2.882674772036474, "percentage": 96.59, "elapsed_time": "1 day, 13:42:17", "remaining_time": "1:19:46"}
|
398 |
+
{"current_steps": 398, "total_steps": 411, "loss": 0.3063, "lr": 3.059358288751202e-08, "epoch": 2.889969604863222, "percentage": 96.84, "elapsed_time": "1 day, 13:48:21", "remaining_time": "1:14:05"}
|
399 |
+
{"current_steps": 399, "total_steps": 411, "loss": 0.3352, "lr": 2.6071842502326526e-08, "epoch": 2.8972644376899694, "percentage": 97.08, "elapsed_time": "1 day, 13:53:32", "remaining_time": "1:08:22"}
|
400 |
+
{"current_steps": 400, "total_steps": 411, "loss": 0.3442, "lr": 2.1910634183644475e-08, "epoch": 2.9045592705167174, "percentage": 97.32, "elapsed_time": "1 day, 13:59:20", "remaining_time": "1:02:40"}
|
401 |
+
{"current_steps": 401, "total_steps": 411, "loss": 0.3196, "lr": 1.811025955404333e-08, "epoch": 2.9118541033434653, "percentage": 97.57, "elapsed_time": "1 day, 14:17:53", "remaining_time": "0:57:18"}
|
402 |
+
{"current_steps": 402, "total_steps": 411, "loss": 0.3319, "lr": 1.4670994081297796e-08, "epoch": 2.9191489361702128, "percentage": 97.81, "elapsed_time": "1 day, 14:22:59", "remaining_time": "0:51:33"}
|