guyhadad01 commited on
Commit
4516c7d
·
verified ·
1 Parent(s): a03bff4

Training in progress, step 32200, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -1303,6 +1303,10 @@ You can finetune this model on your own dataset.
1303
  | 0.5637 | 31900 | 0.2994 |
1304
  | 0.5646 | 31950 | 0.3219 |
1305
  | 0.5655 | 32000 | 0.2902 |
 
 
 
 
1306
 
1307
  </details>
1308
 
 
1303
  | 0.5637 | 31900 | 0.2994 |
1304
  | 0.5646 | 31950 | 0.3219 |
1305
  | 0.5655 | 32000 | 0.2902 |
1306
+ | 0.5663 | 32050 | 0.3896 |
1307
+ | 0.5672 | 32100 | 0.2491 |
1308
+ | 0.5681 | 32150 | 0.2663 |
1309
+ | 0.5690 | 32200 | 0.3433 |
1310
 
1311
  </details>
1312
 
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cea8950aa6683070e22c1a564e52123795831f72f71fb839c14d7de92ee17a17
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:059e5ea13c385fd2b7824c1ae9f5d7517f93ed2064e18f707d204b5f00551fcf
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4ac2571e8a99f96a6e948efc2acbf6f064d1c41ef24c68243b8bfa9248b61bef
3
  size 180609210
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3628f48729b03521592b21ba8e241dd8f7b12c27ab2d17f87975f425eeac02df
3
  size 180609210
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ea96a97725aec5e3c937ef8955386071fe1d87cf2432c4445ce113e85618ebef
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:50d8e0757ed6c29dd6ad40d6348476d9c45a6c913dbe6d558683a2aff7f6eeaa
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b78f9ce48aa6920e09eb307b60e2b49742b779f95ad33075f31c6652ec108e55
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:05d2345a7bbddb12fb6a365e62bd73e47296785a601a5379725821a73d3794f3
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a6de4d7315ff5e38fd38a2be7f1976197684b731feeef6561c2bf9fe182bd3b1
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dfe5ee6b9c7e51d497fade31af9f8cbe420701d187e60d0b9c360cfa22b492c4
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.5654609390185719,
6
  "eval_steps": 500,
7
- "global_step": 32000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -4488,6 +4488,34 @@
4488
  "learning_rate": 2.4152284463293475e-05,
4489
  "loss": 0.2902,
4490
  "step": 32000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
4491
  }
4492
  ],
4493
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.568995069887438,
6
  "eval_steps": 500,
7
+ "global_step": 32200,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
4488
  "learning_rate": 2.4152284463293475e-05,
4489
  "loss": 0.2902,
4490
  "step": 32000
4491
+ },
4492
+ {
4493
+ "epoch": 0.5663444717357884,
4494
+ "grad_norm": 2.785452365875244,
4495
+ "learning_rate": 2.4103198444954943e-05,
4496
+ "loss": 0.3896,
4497
+ "step": 32050
4498
+ },
4499
+ {
4500
+ "epoch": 0.5672280044530049,
4501
+ "grad_norm": 2.5383968353271484,
4502
+ "learning_rate": 2.4054112426616404e-05,
4503
+ "loss": 0.2491,
4504
+ "step": 32100
4505
+ },
4506
+ {
4507
+ "epoch": 0.5681115371702214,
4508
+ "grad_norm": 1.584861397743225,
4509
+ "learning_rate": 2.4005026408277866e-05,
4510
+ "loss": 0.2663,
4511
+ "step": 32150
4512
+ },
4513
+ {
4514
+ "epoch": 0.568995069887438,
4515
+ "grad_norm": 1.5586644411087036,
4516
+ "learning_rate": 2.395594038993933e-05,
4517
+ "loss": 0.3433,
4518
+ "step": 32200
4519
  }
4520
  ],
4521
  "logging_steps": 50,