Training in progress, step 44200, checkpoint
Browse files
last-checkpoint/README.md
CHANGED
@@ -1399,6 +1399,10 @@ You can finetune this model on your own dataset.
|
|
1399 |
| 0.7757 | 43900 | 0.3049 |
|
1400 |
| 0.7766 | 43950 | 0.2939 |
|
1401 |
| 0.7775 | 44000 | 0.2909 |
|
|
|
|
|
|
|
|
|
1402 |
|
1403 |
</details>
|
1404 |
|
|
|
1399 |
| 0.7757 | 43900 | 0.3049 |
|
1400 |
| 0.7766 | 43950 | 0.2939 |
|
1401 |
| 0.7775 | 44000 | 0.2909 |
|
1402 |
+
| 0.7784 | 44050 | 0.2157 |
|
1403 |
+
| 0.7793 | 44100 | 0.2785 |
|
1404 |
+
| 0.7802 | 44150 | 0.2386 |
|
1405 |
+
| 0.7810 | 44200 | 0.3297 |
|
1406 |
|
1407 |
</details>
|
1408 |
|
last-checkpoint/model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 90864192
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3c93ea012da084e7db255bf5307a12bc622616de2b559e1ebc270e29e3930b53
|
3 |
size 90864192
|
last-checkpoint/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 180609210
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0fc375ce7c64e73dfae981ff1f0ee30f111e70f92ece0482506acc2e5c8b7278
|
3 |
size 180609210
|
last-checkpoint/rng_state.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14244
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bc4603f12b61034f467c4243e5cacbd3dc08f83f508811af862a64abae5532b6
|
3 |
size 14244
|
last-checkpoint/scaler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 988
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:086b678b22870553eb0c5be0c61abb20b7fa45eb12fa31835cd26537ecba1df1
|
3 |
size 988
|
last-checkpoint/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1064
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:af3f862129fa543cfe43517f44ed73b2bfc19062f029765e9ae1e7d6bb4162f5
|
3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
@@ -2,9 +2,9 @@
|
|
2 |
"best_global_step": null,
|
3 |
"best_metric": null,
|
4 |
"best_model_checkpoint": null,
|
5 |
-
"epoch": 0.
|
6 |
"eval_steps": 500,
|
7 |
-
"global_step":
|
8 |
"is_hyper_param_search": false,
|
9 |
"is_local_process_zero": true,
|
10 |
"is_world_process_zero": true,
|
@@ -6168,6 +6168,34 @@
|
|
6168 |
"learning_rate": 1.2377530384245351e-05,
|
6169 |
"loss": 0.2909,
|
6170 |
"step": 44000
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
6171 |
}
|
6172 |
],
|
6173 |
"logging_steps": 50,
|
|
|
2 |
"best_global_step": null,
|
3 |
"best_metric": null,
|
4 |
"best_model_checkpoint": null,
|
5 |
+
"epoch": 0.7810429220194024,
|
6 |
"eval_steps": 500,
|
7 |
+
"global_step": 44200,
|
8 |
"is_hyper_param_search": false,
|
9 |
"is_local_process_zero": true,
|
10 |
"is_world_process_zero": true,
|
|
|
6168 |
"learning_rate": 1.2377530384245351e-05,
|
6169 |
"loss": 0.2909,
|
6170 |
"step": 44000
|
6171 |
+
},
|
6172 |
+
{
|
6173 |
+
"epoch": 0.7783923238677528,
|
6174 |
+
"grad_norm": 1.421271562576294,
|
6175 |
+
"learning_rate": 1.2328444365906816e-05,
|
6176 |
+
"loss": 0.2157,
|
6177 |
+
"step": 44050
|
6178 |
+
},
|
6179 |
+
{
|
6180 |
+
"epoch": 0.7792758565849693,
|
6181 |
+
"grad_norm": 1.2172672748565674,
|
6182 |
+
"learning_rate": 1.2279358347568279e-05,
|
6183 |
+
"loss": 0.2785,
|
6184 |
+
"step": 44100
|
6185 |
+
},
|
6186 |
+
{
|
6187 |
+
"epoch": 0.7801593893021859,
|
6188 |
+
"grad_norm": 1.5359545946121216,
|
6189 |
+
"learning_rate": 1.2230272329229744e-05,
|
6190 |
+
"loss": 0.2386,
|
6191 |
+
"step": 44150
|
6192 |
+
},
|
6193 |
+
{
|
6194 |
+
"epoch": 0.7810429220194024,
|
6195 |
+
"grad_norm": 1.3057314157485962,
|
6196 |
+
"learning_rate": 1.2181186310891207e-05,
|
6197 |
+
"loss": 0.3297,
|
6198 |
+
"step": 44200
|
6199 |
}
|
6200 |
],
|
6201 |
"logging_steps": 50,
|