guyhadad01 commited on
Commit
aece7d9
·
verified ·
1 Parent(s): 5193284

Training in progress, step 30400, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -1265,6 +1265,10 @@ You can finetune this model on your own dataset.
1265
  | 0.5319 | 30100 | 0.3204 |
1266
  | 0.5328 | 30150 | 0.2496 |
1267
  | 0.5337 | 30200 | 0.4147 |
 
 
 
 
1268
 
1269
 
1270
  ### Framework Versions
 
1265
  | 0.5319 | 30100 | 0.3204 |
1266
  | 0.5328 | 30150 | 0.2496 |
1267
  | 0.5337 | 30200 | 0.4147 |
1268
+ | 0.5345 | 30250 | 0.3021 |
1269
+ | 0.5354 | 30300 | 0.2758 |
1270
+ | 0.5363 | 30350 | 0.3166 |
1271
+ | 0.5372 | 30400 | 0.35 |
1272
 
1273
 
1274
  ### Framework Versions
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7fdaa72a1273993224fa25cd6ae828434957eb8fe61239c1e320466c47d9b825
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cf79ddb807641f21ab4f124fe2a7f27110c30ccaaa038e866819c2a6c3894db3
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3f37496e89883f6fc386020ad2e2737fb211e26fa5f09d8c0b7ba33fa265d290
3
  size 180609210
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ceffaa43e4f0c60b5feed0fbc2c3565eef53e3ad867186e6797fe95254c2affe
3
  size 180609210
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:81da5af6afb90a5f448879aab382d7c289ea5663dd55fc76a78e2ffba833506d
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:80122c84195c17eb984e073adfb25182010304afad0586ccdcb1a261a3a0f848
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:333f0c5d2657a0d36f7c5d0a5d113f16688fb194846ffda2f04f57fa9aad9a8b
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:528a5407336a16734f58a4f46d586ee071f6f4a258839c4070d301e8f708f0a5
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:556d068be039654c814d6bf835c59f969aab843389d89f79ddf0f3729b9c071a
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ba2e19f20627e37fe99b4ad87f03b959017a779a9fc1b80f764c9a8c0220d435
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.5336537611987772,
6
  "eval_steps": 500,
7
- "global_step": 30200,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -4236,6 +4236,34 @@
4236
  "learning_rate": 2.5918399403114018e-05,
4237
  "loss": 0.4147,
4238
  "step": 30200
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
4239
  }
4240
  ],
4241
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.5371878920676433,
6
  "eval_steps": 500,
7
+ "global_step": 30400,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
4236
  "learning_rate": 2.5918399403114018e-05,
4237
  "loss": 0.4147,
4238
  "step": 30200
4239
+ },
4240
+ {
4241
+ "epoch": 0.5345372939159937,
4242
+ "grad_norm": 1.886425495147705,
4243
+ "learning_rate": 2.5869313384775486e-05,
4244
+ "loss": 0.3021,
4245
+ "step": 30250
4246
+ },
4247
+ {
4248
+ "epoch": 0.5354208266332102,
4249
+ "grad_norm": 1.6316314935684204,
4250
+ "learning_rate": 2.5820227366436944e-05,
4251
+ "loss": 0.2758,
4252
+ "step": 30300
4253
+ },
4254
+ {
4255
+ "epoch": 0.5363043593504268,
4256
+ "grad_norm": 1.3990044593811035,
4257
+ "learning_rate": 2.577114134809841e-05,
4258
+ "loss": 0.3166,
4259
+ "step": 30350
4260
+ },
4261
+ {
4262
+ "epoch": 0.5371878920676433,
4263
+ "grad_norm": 2.1562857627868652,
4264
+ "learning_rate": 2.572205532975987e-05,
4265
+ "loss": 0.35,
4266
+ "step": 30400
4267
  }
4268
  ],
4269
  "logging_steps": 50,