Training in progress, step 31000, checkpoint
Browse files
last-checkpoint/README.md
CHANGED
|
@@ -1277,6 +1277,10 @@ You can finetune this model on your own dataset.
|
|
| 1277 |
| 0.5425 | 30700 | 0.3094 |
|
| 1278 |
| 0.5434 | 30750 | 0.3077 |
|
| 1279 |
| 0.5443 | 30800 | 0.3505 |
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1280 |
|
| 1281 |
|
| 1282 |
### Framework Versions
|
|
|
|
| 1277 |
| 0.5425 | 30700 | 0.3094 |
|
| 1278 |
| 0.5434 | 30750 | 0.3077 |
|
| 1279 |
| 0.5443 | 30800 | 0.3505 |
|
| 1280 |
+
| 0.5451 | 30850 | 0.3485 |
|
| 1281 |
+
| 0.5460 | 30900 | 0.331 |
|
| 1282 |
+
| 0.5469 | 30950 | 0.2846 |
|
| 1283 |
+
| 0.5478 | 31000 | 0.3647 |
|
| 1284 |
|
| 1285 |
|
| 1286 |
### Framework Versions
|
last-checkpoint/model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 90864192
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:88d75ffa8acb9d0ae6da6b85c5ebacb5d6d497b0b7f8d1e0cc906632d66303da
|
| 3 |
size 90864192
|
last-checkpoint/optimizer.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 180609210
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1ce5db6bab84b13b8d6237d74a48b1c574cceb26d03115a289d544fd81b83fe0
|
| 3 |
size 180609210
|
last-checkpoint/rng_state.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 14244
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:225aac588847ab0002b2ca78215dc480b08f8f2752e40d301dfd2554473eaa86
|
| 3 |
size 14244
|
last-checkpoint/scaler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 988
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f17b09e37e3cf1eb4e07e5a39443f3088190a89ec52eee73b652e920bd5e3c6d
|
| 3 |
size 988
|
last-checkpoint/scheduler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1064
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2d9c6b8e683bd0522d336f6d260614dd403087df118f434096a2340dd6c2f5dd
|
| 3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
|
@@ -2,9 +2,9 @@
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
-
"epoch": 0.
|
| 6 |
"eval_steps": 500,
|
| 7 |
-
"global_step":
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
@@ -4320,6 +4320,34 @@
|
|
| 4320 |
"learning_rate": 2.533034890341835e-05,
|
| 4321 |
"loss": 0.3505,
|
| 4322 |
"step": 30800
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 4323 |
}
|
| 4324 |
],
|
| 4325 |
"logging_steps": 50,
|
|
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
+
"epoch": 0.5477902846742415,
|
| 6 |
"eval_steps": 500,
|
| 7 |
+
"global_step": 31000,
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
|
|
| 4320 |
"learning_rate": 2.533034890341835e-05,
|
| 4321 |
"loss": 0.3505,
|
| 4322 |
"step": 30800
|
| 4323 |
+
},
|
| 4324 |
+
{
|
| 4325 |
+
"epoch": 0.5451396865225919,
|
| 4326 |
+
"grad_norm": 1.785367488861084,
|
| 4327 |
+
"learning_rate": 2.5281262885079815e-05,
|
| 4328 |
+
"loss": 0.3485,
|
| 4329 |
+
"step": 30850
|
| 4330 |
+
},
|
| 4331 |
+
{
|
| 4332 |
+
"epoch": 0.5460232192398085,
|
| 4333 |
+
"grad_norm": 4.639885425567627,
|
| 4334 |
+
"learning_rate": 2.523217686674128e-05,
|
| 4335 |
+
"loss": 0.331,
|
| 4336 |
+
"step": 30900
|
| 4337 |
+
},
|
| 4338 |
+
{
|
| 4339 |
+
"epoch": 0.546906751957025,
|
| 4340 |
+
"grad_norm": 1.308772325515747,
|
| 4341 |
+
"learning_rate": 2.518309084840274e-05,
|
| 4342 |
+
"loss": 0.2846,
|
| 4343 |
+
"step": 30950
|
| 4344 |
+
},
|
| 4345 |
+
{
|
| 4346 |
+
"epoch": 0.5477902846742415,
|
| 4347 |
+
"grad_norm": 1.3961265087127686,
|
| 4348 |
+
"learning_rate": 2.5134004830064205e-05,
|
| 4349 |
+
"loss": 0.3647,
|
| 4350 |
+
"step": 31000
|
| 4351 |
}
|
| 4352 |
],
|
| 4353 |
"logging_steps": 50,
|