guyhadad01 commited on
Commit
b733707
·
verified ·
1 Parent(s): 4a0f280

Training in progress, step 30600, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -1269,6 +1269,10 @@ You can finetune this model on your own dataset.
1269
  | 0.5354 | 30300 | 0.2758 |
1270
  | 0.5363 | 30350 | 0.3166 |
1271
  | 0.5372 | 30400 | 0.35 |
 
 
 
 
1272
 
1273
 
1274
  ### Framework Versions
 
1269
  | 0.5354 | 30300 | 0.2758 |
1270
  | 0.5363 | 30350 | 0.3166 |
1271
  | 0.5372 | 30400 | 0.35 |
1272
+ | 0.5381 | 30450 | 0.3391 |
1273
+ | 0.5390 | 30500 | 0.3576 |
1274
+ | 0.5398 | 30550 | 0.295 |
1275
+ | 0.5407 | 30600 | 0.3449 |
1276
 
1277
 
1278
  ### Framework Versions
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cf79ddb807641f21ab4f124fe2a7f27110c30ccaaa038e866819c2a6c3894db3
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5fa3b9879e14ec9f5b4cd6c1fd0c5f2042c31d8024c507b2d4eb4e6f03a86557
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ceffaa43e4f0c60b5feed0fbc2c3565eef53e3ad867186e6797fe95254c2affe
3
  size 180609210
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2d918c870830ed1534f9d4acc1377f61959ec7838ebd0b23de0425c2b516e9d4
3
  size 180609210
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:80122c84195c17eb984e073adfb25182010304afad0586ccdcb1a261a3a0f848
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c0b4ef05441e098f1fa59f720976907d8a3ce65ffd05fdaf038eebceb3ab3d49
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:528a5407336a16734f58a4f46d586ee071f6f4a258839c4070d301e8f708f0a5
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5927361a532fb6c132d07b4ab7a520caf5f685a6698e2682d0ac3b35fea7ca5e
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ba2e19f20627e37fe99b4ad87f03b959017a779a9fc1b80f764c9a8c0220d435
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9ea5eebe3d97676cf6ae4d334b17697b9e89bbac0efa0396db84f4cb8e005a81
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.5371878920676433,
6
  "eval_steps": 500,
7
- "global_step": 30400,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -4264,6 +4264,34 @@
4264
  "learning_rate": 2.572205532975987e-05,
4265
  "loss": 0.35,
4266
  "step": 30400
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
4267
  }
4268
  ],
4269
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.5407220229365094,
6
  "eval_steps": 500,
7
+ "global_step": 30600,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
4264
  "learning_rate": 2.572205532975987e-05,
4265
  "loss": 0.35,
4266
  "step": 30400
4267
+ },
4268
+ {
4269
+ "epoch": 0.5380714247848598,
4270
+ "grad_norm": 1.1287676095962524,
4271
+ "learning_rate": 2.5672969311421334e-05,
4272
+ "loss": 0.3391,
4273
+ "step": 30450
4274
+ },
4275
+ {
4276
+ "epoch": 0.5389549575020763,
4277
+ "grad_norm": 1.7524675130844116,
4278
+ "learning_rate": 2.5623883293082802e-05,
4279
+ "loss": 0.3576,
4280
+ "step": 30500
4281
+ },
4282
+ {
4283
+ "epoch": 0.5398384902192929,
4284
+ "grad_norm": 1.1238594055175781,
4285
+ "learning_rate": 2.5575778995111033e-05,
4286
+ "loss": 0.295,
4287
+ "step": 30550
4288
+ },
4289
+ {
4290
+ "epoch": 0.5407220229365094,
4291
+ "grad_norm": 0.9298042058944702,
4292
+ "learning_rate": 2.5526692976772498e-05,
4293
+ "loss": 0.3449,
4294
+ "step": 30600
4295
  }
4296
  ],
4297
  "logging_steps": 50,