Training in progress, step 32200, checkpoint
Browse files
last-checkpoint/README.md
CHANGED
|
@@ -1303,6 +1303,10 @@ You can finetune this model on your own dataset.
|
|
| 1303 |
| 0.5637 | 31900 | 0.2994 |
|
| 1304 |
| 0.5646 | 31950 | 0.3219 |
|
| 1305 |
| 0.5655 | 32000 | 0.2902 |
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1306 |
|
| 1307 |
</details>
|
| 1308 |
|
|
|
|
| 1303 |
| 0.5637 | 31900 | 0.2994 |
|
| 1304 |
| 0.5646 | 31950 | 0.3219 |
|
| 1305 |
| 0.5655 | 32000 | 0.2902 |
|
| 1306 |
+
| 0.5663 | 32050 | 0.3896 |
|
| 1307 |
+
| 0.5672 | 32100 | 0.2491 |
|
| 1308 |
+
| 0.5681 | 32150 | 0.2663 |
|
| 1309 |
+
| 0.5690 | 32200 | 0.3433 |
|
| 1310 |
|
| 1311 |
</details>
|
| 1312 |
|
last-checkpoint/model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 90864192
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:059e5ea13c385fd2b7824c1ae9f5d7517f93ed2064e18f707d204b5f00551fcf
|
| 3 |
size 90864192
|
last-checkpoint/optimizer.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 180609210
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3628f48729b03521592b21ba8e241dd8f7b12c27ab2d17f87975f425eeac02df
|
| 3 |
size 180609210
|
last-checkpoint/rng_state.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 14244
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:50d8e0757ed6c29dd6ad40d6348476d9c45a6c913dbe6d558683a2aff7f6eeaa
|
| 3 |
size 14244
|
last-checkpoint/scaler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 988
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:05d2345a7bbddb12fb6a365e62bd73e47296785a601a5379725821a73d3794f3
|
| 3 |
size 988
|
last-checkpoint/scheduler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1064
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:dfe5ee6b9c7e51d497fade31af9f8cbe420701d187e60d0b9c360cfa22b492c4
|
| 3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
|
@@ -2,9 +2,9 @@
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
-
"epoch": 0.
|
| 6 |
"eval_steps": 500,
|
| 7 |
-
"global_step":
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
@@ -4488,6 +4488,34 @@
|
|
| 4488 |
"learning_rate": 2.4152284463293475e-05,
|
| 4489 |
"loss": 0.2902,
|
| 4490 |
"step": 32000
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 4491 |
}
|
| 4492 |
],
|
| 4493 |
"logging_steps": 50,
|
|
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
+
"epoch": 0.568995069887438,
|
| 6 |
"eval_steps": 500,
|
| 7 |
+
"global_step": 32200,
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
|
|
| 4488 |
"learning_rate": 2.4152284463293475e-05,
|
| 4489 |
"loss": 0.2902,
|
| 4490 |
"step": 32000
|
| 4491 |
+
},
|
| 4492 |
+
{
|
| 4493 |
+
"epoch": 0.5663444717357884,
|
| 4494 |
+
"grad_norm": 2.785452365875244,
|
| 4495 |
+
"learning_rate": 2.4103198444954943e-05,
|
| 4496 |
+
"loss": 0.3896,
|
| 4497 |
+
"step": 32050
|
| 4498 |
+
},
|
| 4499 |
+
{
|
| 4500 |
+
"epoch": 0.5672280044530049,
|
| 4501 |
+
"grad_norm": 2.5383968353271484,
|
| 4502 |
+
"learning_rate": 2.4054112426616404e-05,
|
| 4503 |
+
"loss": 0.2491,
|
| 4504 |
+
"step": 32100
|
| 4505 |
+
},
|
| 4506 |
+
{
|
| 4507 |
+
"epoch": 0.5681115371702214,
|
| 4508 |
+
"grad_norm": 1.584861397743225,
|
| 4509 |
+
"learning_rate": 2.4005026408277866e-05,
|
| 4510 |
+
"loss": 0.2663,
|
| 4511 |
+
"step": 32150
|
| 4512 |
+
},
|
| 4513 |
+
{
|
| 4514 |
+
"epoch": 0.568995069887438,
|
| 4515 |
+
"grad_norm": 1.5586644411087036,
|
| 4516 |
+
"learning_rate": 2.395594038993933e-05,
|
| 4517 |
+
"loss": 0.3433,
|
| 4518 |
+
"step": 32200
|
| 4519 |
}
|
| 4520 |
],
|
| 4521 |
"logging_steps": 50,
|