Training in progress, step 30600, checkpoint
Browse files
last-checkpoint/README.md
CHANGED
|
@@ -1269,6 +1269,10 @@ You can finetune this model on your own dataset.
|
|
| 1269 |
| 0.5354 | 30300 | 0.2758 |
|
| 1270 |
| 0.5363 | 30350 | 0.3166 |
|
| 1271 |
| 0.5372 | 30400 | 0.35 |
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1272 |
|
| 1273 |
|
| 1274 |
### Framework Versions
|
|
|
|
| 1269 |
| 0.5354 | 30300 | 0.2758 |
|
| 1270 |
| 0.5363 | 30350 | 0.3166 |
|
| 1271 |
| 0.5372 | 30400 | 0.35 |
|
| 1272 |
+
| 0.5381 | 30450 | 0.3391 |
|
| 1273 |
+
| 0.5390 | 30500 | 0.3576 |
|
| 1274 |
+
| 0.5398 | 30550 | 0.295 |
|
| 1275 |
+
| 0.5407 | 30600 | 0.3449 |
|
| 1276 |
|
| 1277 |
|
| 1278 |
### Framework Versions
|
last-checkpoint/model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 90864192
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5fa3b9879e14ec9f5b4cd6c1fd0c5f2042c31d8024c507b2d4eb4e6f03a86557
|
| 3 |
size 90864192
|
last-checkpoint/optimizer.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 180609210
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2d918c870830ed1534f9d4acc1377f61959ec7838ebd0b23de0425c2b516e9d4
|
| 3 |
size 180609210
|
last-checkpoint/rng_state.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 14244
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c0b4ef05441e098f1fa59f720976907d8a3ce65ffd05fdaf038eebceb3ab3d49
|
| 3 |
size 14244
|
last-checkpoint/scaler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 988
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5927361a532fb6c132d07b4ab7a520caf5f685a6698e2682d0ac3b35fea7ca5e
|
| 3 |
size 988
|
last-checkpoint/scheduler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1064
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9ea5eebe3d97676cf6ae4d334b17697b9e89bbac0efa0396db84f4cb8e005a81
|
| 3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
|
@@ -2,9 +2,9 @@
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
-
"epoch": 0.
|
| 6 |
"eval_steps": 500,
|
| 7 |
-
"global_step":
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
@@ -4264,6 +4264,34 @@
|
|
| 4264 |
"learning_rate": 2.572205532975987e-05,
|
| 4265 |
"loss": 0.35,
|
| 4266 |
"step": 30400
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 4267 |
}
|
| 4268 |
],
|
| 4269 |
"logging_steps": 50,
|
|
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
+
"epoch": 0.5407220229365094,
|
| 6 |
"eval_steps": 500,
|
| 7 |
+
"global_step": 30600,
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
|
|
| 4264 |
"learning_rate": 2.572205532975987e-05,
|
| 4265 |
"loss": 0.35,
|
| 4266 |
"step": 30400
|
| 4267 |
+
},
|
| 4268 |
+
{
|
| 4269 |
+
"epoch": 0.5380714247848598,
|
| 4270 |
+
"grad_norm": 1.1287676095962524,
|
| 4271 |
+
"learning_rate": 2.5672969311421334e-05,
|
| 4272 |
+
"loss": 0.3391,
|
| 4273 |
+
"step": 30450
|
| 4274 |
+
},
|
| 4275 |
+
{
|
| 4276 |
+
"epoch": 0.5389549575020763,
|
| 4277 |
+
"grad_norm": 1.7524675130844116,
|
| 4278 |
+
"learning_rate": 2.5623883293082802e-05,
|
| 4279 |
+
"loss": 0.3576,
|
| 4280 |
+
"step": 30500
|
| 4281 |
+
},
|
| 4282 |
+
{
|
| 4283 |
+
"epoch": 0.5398384902192929,
|
| 4284 |
+
"grad_norm": 1.1238594055175781,
|
| 4285 |
+
"learning_rate": 2.5575778995111033e-05,
|
| 4286 |
+
"loss": 0.295,
|
| 4287 |
+
"step": 30550
|
| 4288 |
+
},
|
| 4289 |
+
{
|
| 4290 |
+
"epoch": 0.5407220229365094,
|
| 4291 |
+
"grad_norm": 0.9298042058944702,
|
| 4292 |
+
"learning_rate": 2.5526692976772498e-05,
|
| 4293 |
+
"loss": 0.3449,
|
| 4294 |
+
"step": 30600
|
| 4295 |
}
|
| 4296 |
],
|
| 4297 |
"logging_steps": 50,
|