guyhadad01 commited on
Commit
35c6e74
·
verified ·
1 Parent(s): 2d2130f

Training in progress, step 27000, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -1197,6 +1197,10 @@ You can finetune this model on your own dataset.
1197
  | 0.4718 | 26700 | 0.2572 |
1198
  | 0.4727 | 26750 | 0.2821 |
1199
  | 0.4736 | 26800 | 0.2753 |
 
 
 
 
1200
 
1201
 
1202
  ### Framework Versions
 
1197
  | 0.4718 | 26700 | 0.2572 |
1198
  | 0.4727 | 26750 | 0.2821 |
1199
  | 0.4736 | 26800 | 0.2753 |
1200
+ | 0.4745 | 26850 | 0.2789 |
1201
+ | 0.4753 | 26900 | 0.5175 |
1202
+ | 0.4762 | 26950 | 0.3398 |
1203
+ | 0.4771 | 27000 | 0.3683 |
1204
 
1205
 
1206
  ### Framework Versions
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6af9e8fc53f229d8df337a8754e2d3d5b113d4716605b013bad83e9e09dacdb0
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:157a36f69c8d6be89b19a5fc2041a6a70bae891ca7bdb6e1f8c5561949e9bafa
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:de6d4daedba612d713f9144d945bcc7668fddc99a7c572a8a7ecdaadfce55d9f
3
  size 180609210
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3cf3f6a255c756d17edb6da60dbf398937995bd4e9513159583e5e4237f23a63
3
  size 180609210
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bd90d4d272f52093bcd166fb2fee1129e8da49cd6cade68a0c1872a9ab44bae6
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:77b7843d303f1fcbcb7ded0ee18633ae1a240b93a82ce64b7dc80620210cefa4
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9102615210716abefe38c971af7617c4ceba795e3412ef59968e79b6fe53891e
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f721603f06800f16238813b709df823dd021b986d5f3f64a3fdb3ad2473f4313
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4ca320c82587b083501742caf7cc80ec1a98ca247bf4b8c7cd91053ff97a2d44
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2b9c472a19e7b9448212aaddb68f6d9878d89c838a06487c2d680b2179532b97
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.47357353642805394,
6
  "eval_steps": 500,
7
- "global_step": 26800,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -3760,6 +3760,34 @@
3760
  "learning_rate": 2.9256248650134498e-05,
3761
  "loss": 0.2753,
3762
  "step": 26800
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
3763
  }
3764
  ],
3765
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.47710766729692,
6
  "eval_steps": 500,
7
+ "global_step": 27000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
3760
  "learning_rate": 2.9256248650134498e-05,
3761
  "loss": 0.2753,
3762
  "step": 26800
3763
+ },
3764
+ {
3765
+ "epoch": 0.47445706914527047,
3766
+ "grad_norm": 1.7398908138275146,
3767
+ "learning_rate": 2.920716263179596e-05,
3768
+ "loss": 0.2789,
3769
+ "step": 26850
3770
+ },
3771
+ {
3772
+ "epoch": 0.47534060186248694,
3773
+ "grad_norm": 1.456929087638855,
3774
+ "learning_rate": 2.9158076613457424e-05,
3775
+ "loss": 0.5175,
3776
+ "step": 26900
3777
+ },
3778
+ {
3779
+ "epoch": 0.4762241345797035,
3780
+ "grad_norm": 1.4763001203536987,
3781
+ "learning_rate": 2.910899059511889e-05,
3782
+ "loss": 0.3398,
3783
+ "step": 26950
3784
+ },
3785
+ {
3786
+ "epoch": 0.47710766729692,
3787
+ "grad_norm": 1.3316082954406738,
3788
+ "learning_rate": 2.905990457678035e-05,
3789
+ "loss": 0.3683,
3790
+ "step": 27000
3791
  }
3792
  ],
3793
  "logging_steps": 50,