guyhadad01 commited on
Commit
c791334
·
verified ·
1 Parent(s): d9983ab

Training in progress, step 44000, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -1395,6 +1395,10 @@ You can finetune this model on your own dataset.
1395
  | 0.7722 | 43700 | 0.251 |
1396
  | 0.7731 | 43750 | 0.3154 |
1397
  | 0.7740 | 43800 | 0.3309 |
 
 
 
 
1398
 
1399
  </details>
1400
 
 
1395
  | 0.7722 | 43700 | 0.251 |
1396
  | 0.7731 | 43750 | 0.3154 |
1397
  | 0.7740 | 43800 | 0.3309 |
1398
+ | 0.7749 | 43850 | 0.2768 |
1399
+ | 0.7757 | 43900 | 0.3049 |
1400
+ | 0.7766 | 43950 | 0.2939 |
1401
+ | 0.7775 | 44000 | 0.2909 |
1402
 
1403
  </details>
1404
 
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:87245a00c511204e0c66583191ab9429ad97c78538541227c616f90b8381119e
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:12bbe29ea94a2a3e248956e4ad4f48429053ec1581ede3091505ee45e42c209e
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8b6c1541af87dcd1797f9d736a3cac898e50e3ecafd501e98798ccab543ede07
3
  size 180609210
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fc95281118678bfa685a8fa9d0f9c2b4de3f7f9c764726219c4efe80cd17496a
3
  size 180609210
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:69c36e80b730b2d3f19367fe96dc275025a093a975c30683cdcf06771c2e520f
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2248c4c2662777880f6435205956f86ee9cef13d01a64d9b6e6e97f9ff29c8a6
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0c2a170b686e6b3841063ec2a8f0cf18b4985f4986723acd35709abf15d5c19e
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:41c83ba4cca9cc14a64aa6c3e0597b81f5560663b8d07b1843663e365af550c1
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a1960f4f5d6f42011bfc954842f6c57ccfbbc8ac7380b9fbe5cdcbb8bd1b0029
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:947d6bd91fa66a1fa64426daf31057323ec244470e03f87d8bca1497c127e637
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.7739746602816703,
6
  "eval_steps": 500,
7
- "global_step": 43800,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -6140,6 +6140,34 @@
6140
  "learning_rate": 1.25738744575995e-05,
6141
  "loss": 0.3309,
6142
  "step": 43800
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
6143
  }
6144
  ],
6145
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.7775087911505363,
6
  "eval_steps": 500,
7
+ "global_step": 44000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
6140
  "learning_rate": 1.25738744575995e-05,
6141
  "loss": 0.3309,
6142
  "step": 43800
6143
+ },
6144
+ {
6145
+ "epoch": 0.7748581929988867,
6146
+ "grad_norm": 1.3661130666732788,
6147
+ "learning_rate": 1.2524788439260962e-05,
6148
+ "loss": 0.2768,
6149
+ "step": 43850
6150
+ },
6151
+ {
6152
+ "epoch": 0.7757417257161032,
6153
+ "grad_norm": 1.3001888990402222,
6154
+ "learning_rate": 1.2475702420922425e-05,
6155
+ "loss": 0.3049,
6156
+ "step": 43900
6157
+ },
6158
+ {
6159
+ "epoch": 0.7766252584333198,
6160
+ "grad_norm": 1.4377065896987915,
6161
+ "learning_rate": 1.2426616402583888e-05,
6162
+ "loss": 0.2939,
6163
+ "step": 43950
6164
+ },
6165
+ {
6166
+ "epoch": 0.7775087911505363,
6167
+ "grad_norm": 2.084547519683838,
6168
+ "learning_rate": 1.2377530384245351e-05,
6169
+ "loss": 0.2909,
6170
+ "step": 44000
6171
  }
6172
  ],
6173
  "logging_steps": 50,