guyhadad01 committed on
Commit
095f1be
·
verified ·
1 Parent(s): 8708928

Training in progress, step 33000, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -1319,6 +1319,10 @@ You can finetune this model on your own dataset.
1319
  | 0.5778 | 32700 | 0.3167 |
1320
  | 0.5787 | 32750 | 0.3249 |
1321
  | 0.5796 | 32800 | 0.2443 |
 
 
 
 
1322
 
1323
  </details>
1324
 
 
1319
  | 0.5778 | 32700 | 0.3167 |
1320
  | 0.5787 | 32750 | 0.3249 |
1321
  | 0.5796 | 32800 | 0.2443 |
1322
+ | 0.5805 | 32850 | 0.4113 |
1323
+ | 0.5814 | 32900 | 0.3106 |
1324
+ | 0.5822 | 32950 | 0.2841 |
1325
+ | 0.5831 | 33000 | 0.2786 |
1326
 
1327
  </details>
1328
 
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c149da7590ac756041ddcfa88541f8f1672d3db78462e24c5f353c18f8cebb1d
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c8b30dec528d42a5a4b58c0779ef0039999b571e7dcbffef2ce111e2a8ea9c9a
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a8e3fdce41c8faa034bc2a86a395da561d04329337006adacae71b20e28f454b
3
  size 180609210
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:05ca6048b5b24e0bf5be4461f7f2142898161795f74ad16a156816bab1b72a69
3
  size 180609210
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4dd0555a80b9ec33d03df384178c64ec05cac6166fd02e539edd48eaea584c82
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6f49fa5ae18072a5e2dded1d5d47789d5b789b12fb1067e4364304bf9f3ffb85
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fd929e14e8b21c3d41ba7c4043d8f146abd5c239c07932d39cf0ff21021e6682
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6bbae4a00cda14f6ae28057ccdaac068a27c16d42d3b8e6b2ea21512dca904e3
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:14aac029153ded9414487d954464b6a95a9d2baa46bd0202f6e9ea6df2629338
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:956ff3c13215961a07ede8fd0b963f4f72d5b8c4c7c87011ef7e07dba7cddb0e
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.5795974624940362,
6
  "eval_steps": 500,
7
- "global_step": 32800,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -4600,6 +4600,34 @@
4600
  "learning_rate": 2.3367889890243662e-05,
4601
  "loss": 0.2443,
4602
  "step": 32800
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
4603
  }
4604
  ],
4605
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.5831315933629022,
6
  "eval_steps": 500,
7
+ "global_step": 33000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
4600
  "learning_rate": 2.3367889890243662e-05,
4601
  "loss": 0.2443,
4602
  "step": 32800
4603
+ },
4604
+ {
4605
+ "epoch": 0.5804809952112526,
4606
+ "grad_norm": 1.316084384918213,
4607
+ "learning_rate": 2.331880387190513e-05,
4608
+ "loss": 0.4113,
4609
+ "step": 32850
4610
+ },
4611
+ {
4612
+ "epoch": 0.5813645279284692,
4613
+ "grad_norm": 1.8195414543151855,
4614
+ "learning_rate": 2.3269717853566592e-05,
4615
+ "loss": 0.3106,
4616
+ "step": 32900
4617
+ },
4618
+ {
4619
+ "epoch": 0.5822480606456857,
4620
+ "grad_norm": 1.1715435981750488,
4621
+ "learning_rate": 2.3220631835228053e-05,
4622
+ "loss": 0.2841,
4623
+ "step": 32950
4624
+ },
4625
+ {
4626
+ "epoch": 0.5831315933629022,
4627
+ "grad_norm": 1.3928303718566895,
4628
+ "learning_rate": 2.3171545816889518e-05,
4629
+ "loss": 0.2786,
4630
+ "step": 33000
4631
  }
4632
  ],
4633
  "logging_steps": 50,