Training in progress, step 28200, checkpoint
Browse files
last-checkpoint/README.md
CHANGED
|
@@ -1221,6 +1221,10 @@ You can finetune this model on your own dataset.
|
|
| 1221 |
| 0.4930 | 27900 | 0.4098 |
|
| 1222 |
| 0.4939 | 27950 | 0.3364 |
|
| 1223 |
| 0.4948 | 28000 | 0.3354 |
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1224 |
|
| 1225 |
|
| 1226 |
### Framework Versions
|
|
|
|
| 1221 |
| 0.4930 | 27900 | 0.4098 |
|
| 1222 |
| 0.4939 | 27950 | 0.3364 |
|
| 1223 |
| 0.4948 | 28000 | 0.3354 |
|
| 1224 |
+
| 0.4957 | 28050 | 0.2879 |
|
| 1225 |
+
| 0.4965 | 28100 | 0.3604 |
|
| 1226 |
+
| 0.4974 | 28150 | 0.2612 |
|
| 1227 |
+
| 0.4983 | 28200 | 0.3593 |
|
| 1228 |
|
| 1229 |
|
| 1230 |
### Framework Versions
|
last-checkpoint/model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 90864192
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:aa1965a5554a69ff8c5d7634a28c5f04a03c69dd137851c93b70cebbac2f7e99
|
| 3 |
size 90864192
|
last-checkpoint/optimizer.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 180609210
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:22731b099d557e9c813459e9016c90f95f238923990688ebd670d8401d82293f
|
| 3 |
size 180609210
|
last-checkpoint/rng_state.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 14244
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d49299668d565a8fbf28b1ad8ad6ea4712f5b9b7d3472cc8d598ff75082532ee
|
| 3 |
size 14244
|
last-checkpoint/scaler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 988
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2a77e32486116fb80a72650dd1d3f8b1c3fcfe6b44b779b1f8fb0e11f75bb318
|
| 3 |
size 988
|
last-checkpoint/scheduler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1064
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:be316569338339522180d5bdc62cd0944e9a3d23a5127275cdd38048e9eeda36
|
| 3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
|
@@ -2,9 +2,9 @@
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
-
"epoch": 0.
|
| 6 |
"eval_steps": 500,
|
| 7 |
-
"global_step":
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
@@ -3928,6 +3928,34 @@
|
|
| 3928 |
"learning_rate": 2.8078184210009623e-05,
|
| 3929 |
"loss": 0.3354,
|
| 3930 |
"step": 28000
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 3931 |
}
|
| 3932 |
],
|
| 3933 |
"logging_steps": 50,
|
|
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
+
"epoch": 0.49831245251011647,
|
| 6 |
"eval_steps": 500,
|
| 7 |
+
"global_step": 28200,
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
|
|
| 3928 |
"learning_rate": 2.8078184210009623e-05,
|
| 3929 |
"loss": 0.3354,
|
| 3930 |
"step": 28000
|
| 3931 |
+
},
|
| 3932 |
+
{
|
| 3933 |
+
"epoch": 0.4956618543584669,
|
| 3934 |
+
"grad_norm": 1.141662359237671,
|
| 3935 |
+
"learning_rate": 2.8029098191671088e-05,
|
| 3936 |
+
"loss": 0.2879,
|
| 3937 |
+
"step": 28050
|
| 3938 |
+
},
|
| 3939 |
+
{
|
| 3940 |
+
"epoch": 0.4965453870756834,
|
| 3941 |
+
"grad_norm": 1.5769354104995728,
|
| 3942 |
+
"learning_rate": 2.798001217333255e-05,
|
| 3943 |
+
"loss": 0.3604,
|
| 3944 |
+
"step": 28100
|
| 3945 |
+
},
|
| 3946 |
+
{
|
| 3947 |
+
"epoch": 0.49742891979289994,
|
| 3948 |
+
"grad_norm": 2.3104453086853027,
|
| 3949 |
+
"learning_rate": 2.7930926154994014e-05,
|
| 3950 |
+
"loss": 0.2612,
|
| 3951 |
+
"step": 28150
|
| 3952 |
+
},
|
| 3953 |
+
{
|
| 3954 |
+
"epoch": 0.49831245251011647,
|
| 3955 |
+
"grad_norm": 0.764305830001831,
|
| 3956 |
+
"learning_rate": 2.7881840136655475e-05,
|
| 3957 |
+
"loss": 0.3593,
|
| 3958 |
+
"step": 28200
|
| 3959 |
}
|
| 3960 |
],
|
| 3961 |
"logging_steps": 50,
|