guyhadad01 committed on
Commit
ccc9b01
·
verified ·
1 Parent(s): d579338

Training in progress, step 7400, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -286,9 +286,9 @@ print(embeddings.shape)
286
  # Get the similarity scores for the embeddings
287
  similarities = model.similarity(embeddings, embeddings)
288
  print(similarities)
289
- # tensor([[1.0000, 0.6879, 0.1286],
290
- # [0.6879, 1.0000, 0.1688],
291
- # [0.1286, 0.1688, 1.0000]])
292
  ```
293
 
294
  <!--
@@ -1260,6 +1260,10 @@ You can finetune this model on your own dataset.
1260
  | 0.1255 | 7100 | 0.5155 |
1261
  | 0.1263 | 7150 | 0.4282 |
1262
  | 0.1272 | 7200 | 0.4639 |
 
 
 
 
1263
 
1264
 
1265
  ### Framework Versions
 
286
  # Get the similarity scores for the embeddings
287
  similarities = model.similarity(embeddings, embeddings)
288
  print(similarities)
289
+ # tensor([[1.0000, 0.6815, 0.1033],
290
+ # [0.6815, 1.0000, 0.1434],
291
+ # [0.1033, 0.1434, 1.0000]])
292
  ```
293
 
294
  <!--
 
1260
  | 0.1255 | 7100 | 0.5155 |
1261
  | 0.1263 | 7150 | 0.4282 |
1262
  | 0.1272 | 7200 | 0.4639 |
1263
+ | 0.1281 | 7250 | 0.5294 |
1264
+ | 0.1290 | 7300 | 0.4121 |
1265
+ | 0.1299 | 7350 | 0.4139 |
1266
+ | 0.1308 | 7400 | 0.4311 |
1267
 
1268
 
1269
  ### Framework Versions
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:67e0640c0093f6938269cf5b0ca154261896c0baa13615b9ac24acbc00815c24
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7640a8c5c08cd84ea9d34e9a392788849c161e51fab1fb1e24cf029e4bd1e02b
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5fca48ccb7c4a584f7af19fddac5f49e519b33cedea2b5a68a882138149c59ef
3
  size 180609611
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d8bba72a7f616d924ad3ea248b2f6cbefe36b03a9a05b0265d1aae461c6b1d0f
3
  size 180609611
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:309540c657541ac81d087cbb68ec4167d38f8c9f78a01a5baabdd0e371dee4d2
3
  size 14645
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:234f75280c102551c5f624e1ddf7b22e58abe72b0541e05f85525df9445290c6
3
  size 14645
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1789ba0d507fa201879591abbc90e77d1dba00075efb5f28f2624ffc56affbc2
3
  size 1383
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d4c7f383c5c3caed78012349896a057bf1feaccde880a982830ace58530daa75
3
  size 1383
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:eb2d3fce775411949a9aaee54964b6ea09aaa40534b915c7642ea1c1b586b54a
3
  size 1465
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:86c610364818334e39ecc9c71264546e8b8d4a41c51d290cd21e1ca096739e20
3
  size 1465
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.12722871127917867,
6
  "eval_steps": 500,
7
- "global_step": 7200,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -1016,6 +1016,34 @@
1016
  "learning_rate": 4.8489132355539854e-05,
1017
  "loss": 0.4639,
1018
  "step": 7200
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1019
  }
1020
  ],
1021
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.13076284214804473,
6
  "eval_steps": 500,
7
+ "global_step": 7400,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
1016
  "learning_rate": 4.8489132355539854e-05,
1017
  "loss": 0.4639,
1018
  "step": 7200
1019
+ },
1020
+ {
1021
+ "epoch": 0.12811224399639518,
1022
+ "grad_norm": 1.7154817581176758,
1023
+ "learning_rate": 4.844004633720131e-05,
1024
+ "loss": 0.5294,
1025
+ "step": 7250
1026
+ },
1027
+ {
1028
+ "epoch": 0.1289957767136117,
1029
+ "grad_norm": 2.130659580230713,
1030
+ "learning_rate": 4.839096031886278e-05,
1031
+ "loss": 0.4121,
1032
+ "step": 7300
1033
+ },
1034
+ {
1035
+ "epoch": 0.12987930943082823,
1036
+ "grad_norm": 1.8878060579299927,
1037
+ "learning_rate": 4.834187430052424e-05,
1038
+ "loss": 0.4139,
1039
+ "step": 7350
1040
+ },
1041
+ {
1042
+ "epoch": 0.13076284214804473,
1043
+ "grad_norm": 1.9885565042495728,
1044
+ "learning_rate": 4.82927882821857e-05,
1045
+ "loss": 0.4311,
1046
+ "step": 7400
1047
  }
1048
  ],
1049
  "logging_steps": 50,