guyhadad01 committed on
Commit
3128349
·
verified ·
1 Parent(s): 1d2c3f3

Training in progress, step 3000, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -286,9 +286,9 @@ print(embeddings.shape)
286
  # Get the similarity scores for the embeddings
287
  similarities = model.similarity(embeddings, embeddings)
288
  print(similarities)
289
- # tensor([[1.0000, 0.6549, 0.0935],
290
- # [0.6549, 1.0000, 0.1232],
291
- # [0.0935, 0.1232, 1.0000]])
292
  ```
293
 
294
  <!--
@@ -1280,6 +1280,10 @@ You can finetune this model on your own dataset.
1280
  | 0.0477 | 2700 | 0.5661 |
1281
  | 0.0486 | 2750 | 0.6125 |
1282
  | 0.0495 | 2800 | 0.5105 |
 
 
 
 
1283
 
1284
 
1285
  ### Framework Versions
 
286
  # Get the similarity scores for the embeddings
287
  similarities = model.similarity(embeddings, embeddings)
288
  print(similarities)
289
+ # tensor([[1.0000, 0.5851, 0.1104],
290
+ # [0.5851, 1.0000, 0.1499],
291
+ # [0.1104, 0.1499, 1.0000]])
292
  ```
293
 
294
  <!--
 
1280
  | 0.0477 | 2700 | 0.5661 |
1281
  | 0.0486 | 2750 | 0.6125 |
1282
  | 0.0495 | 2800 | 0.5105 |
1283
+ | 0.0504 | 2850 | 0.5893 |
1284
+ | 0.0512 | 2900 | 0.545 |
1285
+ | 0.0521 | 2950 | 0.5299 |
1286
+ | 0.0530 | 3000 | 0.5186 |
1287
 
1288
 
1289
  ### Framework Versions
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3e151efa72ee25c48973734218defa123cf60ee46518a0b274dfcbca393fb422
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:59bbbce60ef16e762bba9f8a3d9a23a215afa3ee462d98aeaeff69de27f89341
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:73660affbc9d00f2fca3a340ebf70404475af29a08ec697b69c11c1edfc06ecd
3
  size 180609611
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6b5d645070344294324c8e72697f2c1b516db72cb3276a26e4ef639ee18da667
3
  size 180609611
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:64b89b481388e8776a92f8ffb923a2d2f40d85d6a0313cf7ed6f16d7e6a29dcb
3
  size 14645
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2e56f09343792c3d21faf51137b042a641d6fa07972ad9c4af87d2751a155e0e
3
  size 14645
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:091185d50211af5c59ac65d06f51cb55a1ff4a1312de54456a306e4731eb1fa7
3
  size 1383
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5ac1c46a2776d12775d23d0f587efc112188137ce2140da35bc15d301c9f620e
3
  size 1383
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d4232c28bf6d44f06b5f73efd0dc91c5ec7abf414fa6e4b4449aae1bd59d8543
3
  size 1465
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:301ffba56ec75fdb730415687e7a885bf8c0dc112cbdcb4314fb3614afb6e000
3
  size 1465
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.04947783216412504,
6
  "eval_steps": 500,
7
- "global_step": 2800,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -400,6 +400,34 @@
400
  "learning_rate": 2.4726148409893997e-05,
401
  "loss": 0.5105,
402
  "step": 2800
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
403
  }
404
  ],
405
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.05301196303299111,
6
  "eval_steps": 500,
7
+ "global_step": 3000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
400
  "learning_rate": 2.4726148409893997e-05,
401
  "loss": 0.5105,
402
  "step": 2800
403
+ },
404
+ {
405
+ "epoch": 0.050361364881341554,
406
+ "grad_norm": 3.1281192302703857,
407
+ "learning_rate": 2.5167844522968198e-05,
408
+ "loss": 0.5893,
409
+ "step": 2850
410
+ },
411
+ {
412
+ "epoch": 0.051244897598558076,
413
+ "grad_norm": 2.345649242401123,
414
+ "learning_rate": 2.5609540636042406e-05,
415
+ "loss": 0.545,
416
+ "step": 2900
417
+ },
418
+ {
419
+ "epoch": 0.05212843031577459,
420
+ "grad_norm": 2.9023561477661133,
421
+ "learning_rate": 2.605123674911661e-05,
422
+ "loss": 0.5299,
423
+ "step": 2950
424
+ },
425
+ {
426
+ "epoch": 0.05301196303299111,
427
+ "grad_norm": 2.491269588470459,
428
+ "learning_rate": 2.649293286219081e-05,
429
+ "loss": 0.5186,
430
+ "step": 3000
431
  }
432
  ],
433
  "logging_steps": 50,