guyhadad01 commited on
Commit
09ab688
·
verified ·
1 Parent(s): e2c73e6

Training in progress, step 32800, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -1315,6 +1315,10 @@ You can finetune this model on your own dataset.
1315
  | 0.5743 | 32500 | 0.2741 |
1316
  | 0.5752 | 32550 | 0.3546 |
1317
  | 0.5761 | 32600 | 0.3927 |
 
 
 
 
1318
 
1319
  </details>
1320
 
 
1315
  | 0.5743 | 32500 | 0.2741 |
1316
  | 0.5752 | 32550 | 0.3546 |
1317
  | 0.5761 | 32600 | 0.3927 |
1318
+ | 0.5769 | 32650 | 0.2725 |
1319
+ | 0.5778 | 32700 | 0.3167 |
1320
+ | 0.5787 | 32750 | 0.3249 |
1321
+ | 0.5796 | 32800 | 0.2443 |
1322
 
1323
  </details>
1324
 
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:45fd58276a613db39a02b73ae7fb0f916427f84c68306d47cd2dd77d778f740d
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c149da7590ac756041ddcfa88541f8f1672d3db78462e24c5f353c18f8cebb1d
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ad0c582d327743ee610c3253c0a4bdc5cb41fe46898db21b3b1c785e2413a4e9
3
  size 180609210
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a8e3fdce41c8faa034bc2a86a395da561d04329337006adacae71b20e28f454b
3
  size 180609210
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:92457d32429f413543dc4a520ec7ff903eebfb5a9a30773f04a7c15eb4dca6c4
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4dd0555a80b9ec33d03df384178c64ec05cac6166fd02e539edd48eaea584c82
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dc7b96e3cd8fbcf40fa74eb52caa9f2570529a551c9001ee45b2d2020cedf149
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fd929e14e8b21c3d41ba7c4043d8f146abd5c239c07932d39cf0ff21021e6682
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:afd2952fde33bc16ddb69c03104a4d42ffc3097dd2a6f3924f62735831aaadce
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:14aac029153ded9414487d954464b6a95a9d2baa46bd0202f6e9ea6df2629338
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.5760633316251701,
6
  "eval_steps": 500,
7
- "global_step": 32600,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -4572,6 +4572,34 @@
4572
  "learning_rate": 2.356423396359781e-05,
4573
  "loss": 0.3927,
4574
  "step": 32600
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
4575
  }
4576
  ],
4577
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.5795974624940362,
6
  "eval_steps": 500,
7
+ "global_step": 32800,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
4572
  "learning_rate": 2.356423396359781e-05,
4573
  "loss": 0.3927,
4574
  "step": 32600
4575
+ },
4576
+ {
4577
+ "epoch": 0.5769468643423866,
4578
+ "grad_norm": 2.3731272220611572,
4579
+ "learning_rate": 2.3515147945259272e-05,
4580
+ "loss": 0.2725,
4581
+ "step": 32650
4582
+ },
4583
+ {
4584
+ "epoch": 0.5778303970596032,
4585
+ "grad_norm": 1.4900075197219849,
4586
+ "learning_rate": 2.3466061926920737e-05,
4587
+ "loss": 0.3167,
4588
+ "step": 32700
4589
+ },
4590
+ {
4591
+ "epoch": 0.5787139297768197,
4592
+ "grad_norm": 1.2145545482635498,
4593
+ "learning_rate": 2.34169759085822e-05,
4594
+ "loss": 0.3249,
4595
+ "step": 32750
4596
+ },
4597
+ {
4598
+ "epoch": 0.5795974624940362,
4599
+ "grad_norm": 1.725298285484314,
4600
+ "learning_rate": 2.3367889890243662e-05,
4601
+ "loss": 0.2443,
4602
+ "step": 32800
4603
  }
4604
  ],
4605
  "logging_steps": 50,