guyhadad01 commited on
Commit
6be6dca
·
verified ·
1 Parent(s): 114ec5d

Training in progress, step 26200, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -1547,6 +1547,10 @@ You can finetune this model on your own dataset.
1547
  | 0.4577 | 25900 | 0.3418 |
1548
  | 0.4586 | 25950 | 0.3351 |
1549
  | 0.4594 | 26000 | 0.3117 |
 
 
 
 
1550
 
1551
  </details>
1552
 
 
1547
  | 0.4577 | 25900 | 0.3418 |
1548
  | 0.4586 | 25950 | 0.3351 |
1549
  | 0.4594 | 26000 | 0.3117 |
1550
+ | 0.4603 | 26050 | 0.3197 |
1551
+ | 0.4612 | 26100 | 0.2856 |
1552
+ | 0.4621 | 26150 | 0.3668 |
1553
+ | 0.4630 | 26200 | 0.4672 |
1554
 
1555
  </details>
1556
 
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3d9b275662690960867e4c5004de25c023e37f1f7c4ebe3e55950090be859db5
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7aa3ad48db251d65c420989c1a1065641651336023e357be269465da6c52b747
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ccf58858fe88830e35307ea10b8a5b6180e3bcc733d316d0262f05ad1036e132
3
  size 180609210
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4cd5be8c20557f7368b8eca8b965e515fb0eede32019b1a858661a9114b93a2a
3
  size 180609210
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fa2ed85cbcfc26a558906734eea48312aeda57b3baa4220e882e04b5dde95173
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:37d8388f61f2558efc37c86034b939b40258c4860b329143c81ea5c904f59277
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a5a1824f2390986b90c617282d9a88df5bdc60e3f12c5d84551697fb36352fa3
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7f427cb46047bcb3e8371ea8ff734f8d8ca109ef018f2637b4d5fa5935ce5feb
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:67c6214bd46d06bb31b87e2550447bf08cbff7452cc6c1e25562bc8a18251786
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bdb82bc459c496a0f434edcf728ea9313ee27e26d061cb72011f6899ef196598
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.45943701295258965,
6
  "eval_steps": 500,
7
- "global_step": 26000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -3648,6 +3648,34 @@
3648
  "learning_rate": 3.004064322318431e-05,
3649
  "loss": 0.3117,
3650
  "step": 26000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
3651
  }
3652
  ],
3653
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.4629711438214557,
6
  "eval_steps": 500,
7
+ "global_step": 26200,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
3648
  "learning_rate": 3.004064322318431e-05,
3649
  "loss": 0.3117,
3650
  "step": 26000
3651
+ },
3652
+ {
3653
+ "epoch": 0.4603205456698062,
3654
+ "grad_norm": 1.4303230047225952,
3655
+ "learning_rate": 2.9991557204845772e-05,
3656
+ "loss": 0.3197,
3657
+ "step": 26050
3658
+ },
3659
+ {
3660
+ "epoch": 0.46120407838702265,
3661
+ "grad_norm": 3.692739248275757,
3662
+ "learning_rate": 2.9942471186507237e-05,
3663
+ "loss": 0.2856,
3664
+ "step": 26100
3665
+ },
3666
+ {
3667
+ "epoch": 0.4620876111042392,
3668
+ "grad_norm": 2.6494288444519043,
3669
+ "learning_rate": 2.98933851681687e-05,
3670
+ "loss": 0.3668,
3671
+ "step": 26150
3672
+ },
3673
+ {
3674
+ "epoch": 0.4629711438214557,
3675
+ "grad_norm": 1.832560420036316,
3676
+ "learning_rate": 2.9844299149830163e-05,
3677
+ "loss": 0.4672,
3678
+ "step": 26200
3679
  }
3680
  ],
3681
  "logging_steps": 50,