guyhadad01 committed on
Commit
ed61099
·
verified ·
1 Parent(s): 0140d2a

Training in progress, step 4800, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -286,9 +286,9 @@ print(embeddings.shape)
286
  # Get the similarity scores for the embeddings
287
  similarities = model.similarity(embeddings, embeddings)
288
  print(similarities)
289
- # tensor([[1.0000, 0.6246, 0.1173],
290
- # [0.6246, 1.0000, 0.1638],
291
- # [0.1173, 0.1638, 1.0000]])
292
  ```
293
 
294
  <!--
@@ -1316,6 +1316,10 @@ You can finetune this model on your own dataset.
1316
  | 0.0795 | 4500 | 0.4553 |
1317
  | 0.0804 | 4550 | 0.4598 |
1318
  | 0.0813 | 4600 | 0.5445 |
 
 
 
 
1319
 
1320
 
1321
  ### Framework Versions
 
286
  # Get the similarity scores for the embeddings
287
  similarities = model.similarity(embeddings, embeddings)
288
  print(similarities)
289
+ # tensor([[1.0000, 0.6133, 0.1462],
290
+ # [0.6133, 1.0000, 0.1725],
291
+ # [0.1462, 0.1725, 1.0000]])
292
  ```
293
 
294
  <!--
 
1316
  | 0.0795 | 4500 | 0.4553 |
1317
  | 0.0804 | 4550 | 0.4598 |
1318
  | 0.0813 | 4600 | 0.5445 |
1319
+ | 0.0822 | 4650 | 0.4537 |
1320
+ | 0.0831 | 4700 | 0.5158 |
1321
+ | 0.0839 | 4750 | 0.4598 |
1322
+ | 0.0848 | 4800 | 0.4662 |
1323
 
1324
 
1325
  ### Framework Versions
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8de4e67c75f4b4a7427b2810b985973120199b61a5e131a31184941440675588
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:455ab825540498b5f5b373a58b71653674612a70e8ee7fc5be9b1867efa7eac4
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7a2de7647e7106c94dd0498982cecf5e23bcd6cc4a2d106abd4e0a67ed761131
3
  size 180609611
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3bf9c1feb933a833e9a1940398a123539c973a5c3ef49342b6ba0a21987b8a62
3
  size 180609611
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a0c125bd90db08e6be99cb0172e0d523e9ccee0b8234c431ef93a30e9252f3b6
3
  size 14645
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eb98f3b30b900a902f900b8100ff06f09878e462230501b172e1989e2314478f
3
  size 14645
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1d5f1d0b668240e318afe61a3e255204044d52e6d78b98d08469e3aaa3293711
3
  size 1383
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b429070a564985551cfca2e541b4c4fca20d998c67cc7cb6e2b59f638df425a3
3
  size 1383
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c485dc831eee1163015670289f311918797d3da6236e5f584fb1d2dbee1714b9
3
  size 1465
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b4d7d41c126e55275e34a7a7f11165206f98f8c233f762fcdd72745ff49aac18
3
  size 1465
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.0812850099839197,
6
  "eval_steps": 500,
7
- "global_step": 4600,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -652,6 +652,34 @@
652
  "learning_rate": 4.0627208480565374e-05,
653
  "loss": 0.5445,
654
  "step": 4600
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
655
  }
656
  ],
657
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.08481914085278577,
6
  "eval_steps": 500,
7
+ "global_step": 4800,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
652
  "learning_rate": 4.0627208480565374e-05,
653
  "loss": 0.5445,
654
  "step": 4600
655
+ },
656
+ {
657
+ "epoch": 0.08216854270113623,
658
+ "grad_norm": 2.4177329540252686,
659
+ "learning_rate": 4.106890459363958e-05,
660
+ "loss": 0.4537,
661
+ "step": 4650
662
+ },
663
+ {
664
+ "epoch": 0.08305207541835274,
665
+ "grad_norm": 2.6188764572143555,
666
+ "learning_rate": 4.151060070671378e-05,
667
+ "loss": 0.5158,
668
+ "step": 4700
669
+ },
670
+ {
671
+ "epoch": 0.08393560813556926,
672
+ "grad_norm": 3.5044455528259277,
673
+ "learning_rate": 4.195229681978799e-05,
674
+ "loss": 0.4598,
675
+ "step": 4750
676
+ },
677
+ {
678
+ "epoch": 0.08481914085278577,
679
+ "grad_norm": 2.2751505374908447,
680
+ "learning_rate": 4.239399293286219e-05,
681
+ "loss": 0.4662,
682
+ "step": 4800
683
  }
684
  ],
685
  "logging_steps": 50,