guyhadad01 commited on
Commit
0230a0a
·
verified ·
1 Parent(s): a289786

Training in progress, step 44200, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -1399,6 +1399,10 @@ You can finetune this model on your own dataset.
1399
  | 0.7757 | 43900 | 0.3049 |
1400
  | 0.7766 | 43950 | 0.2939 |
1401
  | 0.7775 | 44000 | 0.2909 |
 
 
 
 
1402
 
1403
  </details>
1404
 
 
1399
  | 0.7757 | 43900 | 0.3049 |
1400
  | 0.7766 | 43950 | 0.2939 |
1401
  | 0.7775 | 44000 | 0.2909 |
1402
+ | 0.7784 | 44050 | 0.2157 |
1403
+ | 0.7793 | 44100 | 0.2785 |
1404
+ | 0.7802 | 44150 | 0.2386 |
1405
+ | 0.7810 | 44200 | 0.3297 |
1406
 
1407
  </details>
1408
 
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:12bbe29ea94a2a3e248956e4ad4f48429053ec1581ede3091505ee45e42c209e
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3c93ea012da084e7db255bf5307a12bc622616de2b559e1ebc270e29e3930b53
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fc95281118678bfa685a8fa9d0f9c2b4de3f7f9c764726219c4efe80cd17496a
3
  size 180609210
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0fc375ce7c64e73dfae981ff1f0ee30f111e70f92ece0482506acc2e5c8b7278
3
  size 180609210
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2248c4c2662777880f6435205956f86ee9cef13d01a64d9b6e6e97f9ff29c8a6
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bc4603f12b61034f467c4243e5cacbd3dc08f83f508811af862a64abae5532b6
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:41c83ba4cca9cc14a64aa6c3e0597b81f5560663b8d07b1843663e365af550c1
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:086b678b22870553eb0c5be0c61abb20b7fa45eb12fa31835cd26537ecba1df1
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:947d6bd91fa66a1fa64426daf31057323ec244470e03f87d8bca1497c127e637
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:af3f862129fa543cfe43517f44ed73b2bfc19062f029765e9ae1e7d6bb4162f5
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.7775087911505363,
6
  "eval_steps": 500,
7
- "global_step": 44000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -6168,6 +6168,34 @@
6168
  "learning_rate": 1.2377530384245351e-05,
6169
  "loss": 0.2909,
6170
  "step": 44000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
6171
  }
6172
  ],
6173
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.7810429220194024,
6
  "eval_steps": 500,
7
+ "global_step": 44200,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
6168
  "learning_rate": 1.2377530384245351e-05,
6169
  "loss": 0.2909,
6170
  "step": 44000
6171
+ },
6172
+ {
6173
+ "epoch": 0.7783923238677528,
6174
+ "grad_norm": 1.421271562576294,
6175
+ "learning_rate": 1.2328444365906816e-05,
6176
+ "loss": 0.2157,
6177
+ "step": 44050
6178
+ },
6179
+ {
6180
+ "epoch": 0.7792758565849693,
6181
+ "grad_norm": 1.2172672748565674,
6182
+ "learning_rate": 1.2279358347568279e-05,
6183
+ "loss": 0.2785,
6184
+ "step": 44100
6185
+ },
6186
+ {
6187
+ "epoch": 0.7801593893021859,
6188
+ "grad_norm": 1.5359545946121216,
6189
+ "learning_rate": 1.2230272329229744e-05,
6190
+ "loss": 0.2386,
6191
+ "step": 44150
6192
+ },
6193
+ {
6194
+ "epoch": 0.7810429220194024,
6195
+ "grad_norm": 1.3057314157485962,
6196
+ "learning_rate": 1.2181186310891207e-05,
6197
+ "loss": 0.3297,
6198
+ "step": 44200
6199
  }
6200
  ],
6201
  "logging_steps": 50,