guyhadad01 committed on
Commit
4400405
·
verified ·
1 Parent(s): 7de40c1

Training in progress, step 28200, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -1221,6 +1221,10 @@ You can finetune this model on your own dataset.
1221
  | 0.4930 | 27900 | 0.4098 |
1222
  | 0.4939 | 27950 | 0.3364 |
1223
  | 0.4948 | 28000 | 0.3354 |
 
 
 
 
1224
 
1225
 
1226
  ### Framework Versions
 
1221
  | 0.4930 | 27900 | 0.4098 |
1222
  | 0.4939 | 27950 | 0.3364 |
1223
  | 0.4948 | 28000 | 0.3354 |
1224
+ | 0.4957 | 28050 | 0.2879 |
1225
+ | 0.4965 | 28100 | 0.3604 |
1226
+ | 0.4974 | 28150 | 0.2612 |
1227
+ | 0.4983 | 28200 | 0.3593 |
1228
 
1229
 
1230
  ### Framework Versions
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:de68ecb62cb177a69e2ea7a2d8815c238cc32cec342188055a5fefa4de66dcc5
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aa1965a5554a69ff8c5d7634a28c5f04a03c69dd137851c93b70cebbac2f7e99
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e99ec639b3e9bec0cbb3889051137c9795f5cf34c03f83c5e27e4203004378a8
3
  size 180609210
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:22731b099d557e9c813459e9016c90f95f238923990688ebd670d8401d82293f
3
  size 180609210
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9b2bb1065a03f3a3cc81b13be34dd1b158c384419d61db5c56d91448ea10ea2e
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d49299668d565a8fbf28b1ad8ad6ea4712f5b9b7d3472cc8d598ff75082532ee
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b46b4db6042cc9cc0d2e82b27079ac2205bbc9a103068ad0178d3c56c11b3021
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2a77e32486116fb80a72650dd1d3f8b1c3fcfe6b44b779b1f8fb0e11f75bb318
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2b4cd14cf09830d2d2a5966f0c329a3b566132e79593057303cd71a113d5be9d
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be316569338339522180d5bdc62cd0944e9a3d23a5127275cdd38048e9eeda36
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.49477832164125035,
6
  "eval_steps": 500,
7
- "global_step": 28000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -3928,6 +3928,34 @@
3928
  "learning_rate": 2.8078184210009623e-05,
3929
  "loss": 0.3354,
3930
  "step": 28000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
3931
  }
3932
  ],
3933
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.49831245251011647,
6
  "eval_steps": 500,
7
+ "global_step": 28200,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
3928
  "learning_rate": 2.8078184210009623e-05,
3929
  "loss": 0.3354,
3930
  "step": 28000
3931
+ },
3932
+ {
3933
+ "epoch": 0.4956618543584669,
3934
+ "grad_norm": 1.141662359237671,
3935
+ "learning_rate": 2.8029098191671088e-05,
3936
+ "loss": 0.2879,
3937
+ "step": 28050
3938
+ },
3939
+ {
3940
+ "epoch": 0.4965453870756834,
3941
+ "grad_norm": 1.5769354104995728,
3942
+ "learning_rate": 2.798001217333255e-05,
3943
+ "loss": 0.3604,
3944
+ "step": 28100
3945
+ },
3946
+ {
3947
+ "epoch": 0.49742891979289994,
3948
+ "grad_norm": 2.3104453086853027,
3949
+ "learning_rate": 2.7930926154994014e-05,
3950
+ "loss": 0.2612,
3951
+ "step": 28150
3952
+ },
3953
+ {
3954
+ "epoch": 0.49831245251011647,
3955
+ "grad_norm": 0.764305830001831,
3956
+ "learning_rate": 2.7881840136655475e-05,
3957
+ "loss": 0.3593,
3958
+ "step": 28200
3959
  }
3960
  ],
3961
  "logging_steps": 50,