Training in progress, step 32000, checkpoint
Browse files
last-checkpoint/README.md
CHANGED
|
@@ -1299,6 +1299,10 @@ You can finetune this model on your own dataset.
|
|
| 1299 |
| 0.5602 | 31700 | 0.3578 |
|
| 1300 |
| 0.5610 | 31750 | 0.3193 |
|
| 1301 |
| 0.5619 | 31800 | 0.327 |
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1302 |
|
| 1303 |
</details>
|
| 1304 |
|
|
|
|
| 1299 |
| 0.5602 | 31700 | 0.3578 |
|
| 1300 |
| 0.5610 | 31750 | 0.3193 |
|
| 1301 |
| 0.5619 | 31800 | 0.327 |
|
| 1302 |
+
| 0.5628 | 31850 | 0.3429 |
|
| 1303 |
+
| 0.5637 | 31900 | 0.2994 |
|
| 1304 |
+
| 0.5646 | 31950 | 0.3219 |
|
| 1305 |
+
| 0.5655 | 32000 | 0.2902 |
|
| 1306 |
|
| 1307 |
</details>
|
| 1308 |
|
last-checkpoint/model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 90864192
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cea8950aa6683070e22c1a564e52123795831f72f71fb839c14d7de92ee17a17
|
| 3 |
size 90864192
|
last-checkpoint/optimizer.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 180609210
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4ac2571e8a99f96a6e948efc2acbf6f064d1c41ef24c68243b8bfa9248b61bef
|
| 3 |
size 180609210
|
last-checkpoint/rng_state.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 14244
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ea96a97725aec5e3c937ef8955386071fe1d87cf2432c4445ce113e85618ebef
|
| 3 |
size 14244
|
last-checkpoint/scaler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 988
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b78f9ce48aa6920e09eb307b60e2b49742b779f95ad33075f31c6652ec108e55
|
| 3 |
size 988
|
last-checkpoint/scheduler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1064
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a6de4d7315ff5e38fd38a2be7f1976197684b731feeef6561c2bf9fe182bd3b1
|
| 3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
|
@@ -2,9 +2,9 @@
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
-
"epoch": 0.
|
| 6 |
"eval_steps": 500,
|
| 7 |
-
"global_step":
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
@@ -4460,6 +4460,34 @@
|
|
| 4460 |
"learning_rate": 2.4348628536647623e-05,
|
| 4461 |
"loss": 0.327,
|
| 4462 |
"step": 31800
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 4463 |
}
|
| 4464 |
],
|
| 4465 |
"logging_steps": 50,
|
|
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
+
"epoch": 0.5654609390185719,
|
| 6 |
"eval_steps": 500,
|
| 7 |
+
"global_step": 32000,
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
|
|
| 4460 |
"learning_rate": 2.4348628536647623e-05,
|
| 4461 |
"loss": 0.327,
|
| 4462 |
"step": 31800
|
| 4463 |
+
},
|
| 4464 |
+
{
|
| 4465 |
+
"epoch": 0.5628103408669223,
|
| 4466 |
+
"grad_norm": 1.445654034614563,
|
| 4467 |
+
"learning_rate": 2.4299542518309084e-05,
|
| 4468 |
+
"loss": 0.3429,
|
| 4469 |
+
"step": 31850
|
| 4470 |
+
},
|
| 4471 |
+
{
|
| 4472 |
+
"epoch": 0.5636938735841388,
|
| 4473 |
+
"grad_norm": 1.3795325756072998,
|
| 4474 |
+
"learning_rate": 2.425045649997055e-05,
|
| 4475 |
+
"loss": 0.2994,
|
| 4476 |
+
"step": 31900
|
| 4477 |
+
},
|
| 4478 |
+
{
|
| 4479 |
+
"epoch": 0.5645774063013553,
|
| 4480 |
+
"grad_norm": 1.7217411994934082,
|
| 4481 |
+
"learning_rate": 2.4201370481632014e-05,
|
| 4482 |
+
"loss": 0.3219,
|
| 4483 |
+
"step": 31950
|
| 4484 |
+
},
|
| 4485 |
+
{
|
| 4486 |
+
"epoch": 0.5654609390185719,
|
| 4487 |
+
"grad_norm": 1.3482351303100586,
|
| 4488 |
+
"learning_rate": 2.4152284463293475e-05,
|
| 4489 |
+
"loss": 0.2902,
|
| 4490 |
+
"step": 32000
|
| 4491 |
}
|
| 4492 |
],
|
| 4493 |
"logging_steps": 50,
|