Training in progress, step 55600, checkpoint
Browse files
last-checkpoint/README.md
CHANGED
|
@@ -1265,6 +1265,10 @@ You can finetune this model on your own dataset.
|
|
| 1265 |
| 0.9772 | 55300 | 0.3787 |
|
| 1266 |
| 0.9781 | 55350 | 0.3196 |
|
| 1267 |
| 0.9790 | 55400 | 0.3738 |
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1268 |
|
| 1269 |
|
| 1270 |
### Framework Versions
|
|
|
|
| 1265 |
| 0.9772 | 55300 | 0.3787 |
|
| 1266 |
| 0.9781 | 55350 | 0.3196 |
|
| 1267 |
| 0.9790 | 55400 | 0.3738 |
|
| 1268 |
+
| 0.9798 | 55450 | 0.3588 |
|
| 1269 |
+
| 0.9807 | 55500 | 0.3559 |
|
| 1270 |
+
| 0.9816 | 55550 | 0.4382 |
|
| 1271 |
+
| 0.9825 | 55600 | 0.2588 |
|
| 1272 |
|
| 1273 |
|
| 1274 |
### Framework Versions
|
last-checkpoint/model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 90864192
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4757af97769f9bf496f79482c67b4ad52305ab54793692a8f0992bfb1b3e1d99
|
| 3 |
size 90864192
|
last-checkpoint/optimizer.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 180609210
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bc0ad85e5b5865c2909f3ef475b6781df3d6695ce915b04da508edcabe1e676c
|
| 3 |
size 180609210
|
last-checkpoint/rng_state.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 14244
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:53cd51ebdd8de8dece2e081300401e55897bd6527506b231b719e81675496d96
|
| 3 |
size 14244
|
last-checkpoint/scaler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 988
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9cadf5e13e62099775fee57e6f6e29864a5e8da9a1f19033bf424bca204d48d8
|
| 3 |
size 988
|
last-checkpoint/scheduler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1064
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:40c3ccdbd565485480694df123a18cb3bc6089aca7ac0b1c3670702db7f9e007
|
| 3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
|
@@ -2,9 +2,9 @@
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
-
"epoch": 0.
|
| 6 |
"eval_steps": 500,
|
| 7 |
-
"global_step":
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
@@ -7764,6 +7764,34 @@
|
|
| 7764 |
"learning_rate": 1.191808525259665e-06,
|
| 7765 |
"loss": 0.3738,
|
| 7766 |
"step": 55400
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 7767 |
}
|
| 7768 |
],
|
| 7769 |
"logging_steps": 50,
|
|
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
+
"epoch": 0.9824883815447686,
|
| 6 |
"eval_steps": 500,
|
| 7 |
+
"global_step": 55600,
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
|
|
| 7764 |
"learning_rate": 1.191808525259665e-06,
|
| 7765 |
"loss": 0.3738,
|
| 7766 |
"step": 55400
|
| 7767 |
+
},
|
| 7768 |
+
{
|
| 7769 |
+
"epoch": 0.979837783393119,
|
| 7770 |
+
"grad_norm": 1.5018582344055176,
|
| 7771 |
+
"learning_rate": 1.1427225069211286e-06,
|
| 7772 |
+
"loss": 0.3588,
|
| 7773 |
+
"step": 55450
|
| 7774 |
+
},
|
| 7775 |
+
{
|
| 7776 |
+
"epoch": 0.9807213161103355,
|
| 7777 |
+
"grad_norm": 1.1979721784591675,
|
| 7778 |
+
"learning_rate": 1.0936364885825922e-06,
|
| 7779 |
+
"loss": 0.3559,
|
| 7780 |
+
"step": 55500
|
| 7781 |
+
},
|
| 7782 |
+
{
|
| 7783 |
+
"epoch": 0.9816048488275521,
|
| 7784 |
+
"grad_norm": 3.014507532119751,
|
| 7785 |
+
"learning_rate": 1.0445504702440556e-06,
|
| 7786 |
+
"loss": 0.4382,
|
| 7787 |
+
"step": 55550
|
| 7788 |
+
},
|
| 7789 |
+
{
|
| 7790 |
+
"epoch": 0.9824883815447686,
|
| 7791 |
+
"grad_norm": 1.5364562273025513,
|
| 7792 |
+
"learning_rate": 9.954644519055192e-07,
|
| 7793 |
+
"loss": 0.2588,
|
| 7794 |
+
"step": 55600
|
| 7795 |
}
|
| 7796 |
],
|
| 7797 |
"logging_steps": 50,
|