Training in progress, step 27000, checkpoint
Browse files
last-checkpoint/README.md
CHANGED
|
@@ -1197,6 +1197,10 @@ You can finetune this model on your own dataset.
|
|
| 1197 |
| 0.4718 | 26700 | 0.2572 |
|
| 1198 |
| 0.4727 | 26750 | 0.2821 |
|
| 1199 |
| 0.4736 | 26800 | 0.2753 |
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1200 |
|
| 1201 |
|
| 1202 |
### Framework Versions
|
|
|
|
| 1197 |
| 0.4718 | 26700 | 0.2572 |
|
| 1198 |
| 0.4727 | 26750 | 0.2821 |
|
| 1199 |
| 0.4736 | 26800 | 0.2753 |
|
| 1200 |
+
| 0.4745 | 26850 | 0.2789 |
|
| 1201 |
+
| 0.4753 | 26900 | 0.5175 |
|
| 1202 |
+
| 0.4762 | 26950 | 0.3398 |
|
| 1203 |
+
| 0.4771 | 27000 | 0.3683 |
|
| 1204 |
|
| 1205 |
|
| 1206 |
### Framework Versions
|
last-checkpoint/model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 90864192
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:157a36f69c8d6be89b19a5fc2041a6a70bae891ca7bdb6e1f8c5561949e9bafa
|
| 3 |
size 90864192
|
last-checkpoint/optimizer.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 180609210
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3cf3f6a255c756d17edb6da60dbf398937995bd4e9513159583e5e4237f23a63
|
| 3 |
size 180609210
|
last-checkpoint/rng_state.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 14244
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:77b7843d303f1fcbcb7ded0ee18633ae1a240b93a82ce64b7dc80620210cefa4
|
| 3 |
size 14244
|
last-checkpoint/scaler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 988
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f721603f06800f16238813b709df823dd021b986d5f3f64a3fdb3ad2473f4313
|
| 3 |
size 988
|
last-checkpoint/scheduler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1064
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2b9c472a19e7b9448212aaddb68f6d9878d89c838a06487c2d680b2179532b97
|
| 3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
|
@@ -2,9 +2,9 @@
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
-
"epoch": 0.
|
| 6 |
"eval_steps": 500,
|
| 7 |
-
"global_step":
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
@@ -3760,6 +3760,34 @@
|
|
| 3760 |
"learning_rate": 2.9256248650134498e-05,
|
| 3761 |
"loss": 0.2753,
|
| 3762 |
"step": 26800
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 3763 |
}
|
| 3764 |
],
|
| 3765 |
"logging_steps": 50,
|
|
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
+
"epoch": 0.47710766729692,
|
| 6 |
"eval_steps": 500,
|
| 7 |
+
"global_step": 27000,
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
|
|
| 3760 |
"learning_rate": 2.9256248650134498e-05,
|
| 3761 |
"loss": 0.2753,
|
| 3762 |
"step": 26800
|
| 3763 |
+
},
|
| 3764 |
+
{
|
| 3765 |
+
"epoch": 0.47445706914527047,
|
| 3766 |
+
"grad_norm": 1.7398908138275146,
|
| 3767 |
+
"learning_rate": 2.920716263179596e-05,
|
| 3768 |
+
"loss": 0.2789,
|
| 3769 |
+
"step": 26850
|
| 3770 |
+
},
|
| 3771 |
+
{
|
| 3772 |
+
"epoch": 0.47534060186248694,
|
| 3773 |
+
"grad_norm": 1.456929087638855,
|
| 3774 |
+
"learning_rate": 2.9158076613457424e-05,
|
| 3775 |
+
"loss": 0.5175,
|
| 3776 |
+
"step": 26900
|
| 3777 |
+
},
|
| 3778 |
+
{
|
| 3779 |
+
"epoch": 0.4762241345797035,
|
| 3780 |
+
"grad_norm": 1.4763001203536987,
|
| 3781 |
+
"learning_rate": 2.910899059511889e-05,
|
| 3782 |
+
"loss": 0.3398,
|
| 3783 |
+
"step": 26950
|
| 3784 |
+
},
|
| 3785 |
+
{
|
| 3786 |
+
"epoch": 0.47710766729692,
|
| 3787 |
+
"grad_norm": 1.3316082954406738,
|
| 3788 |
+
"learning_rate": 2.905990457678035e-05,
|
| 3789 |
+
"loss": 0.3683,
|
| 3790 |
+
"step": 27000
|
| 3791 |
}
|
| 3792 |
],
|
| 3793 |
"logging_steps": 50,
|