guyhadad01 committed on
Commit
2d101a2
·
verified ·
1 Parent(s): a08a767

Training in progress, step 7600, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -286,9 +286,9 @@ print(embeddings.shape)
286
  # Get the similarity scores for the embeddings
287
  similarities = model.similarity(embeddings, embeddings)
288
  print(similarities)
289
- # tensor([[1.0000, 0.6815, 0.1033],
290
- # [0.6815, 1.0000, 0.1434],
291
- # [0.1033, 0.1434, 1.0000]])
292
  ```
293
 
294
  <!--
@@ -1264,6 +1264,10 @@ You can finetune this model on your own dataset.
1264
  | 0.1290 | 7300 | 0.4121 |
1265
  | 0.1299 | 7350 | 0.4139 |
1266
  | 0.1308 | 7400 | 0.4311 |
 
 
 
 
1267
 
1268
 
1269
  ### Framework Versions
 
286
  # Get the similarity scores for the embeddings
287
  similarities = model.similarity(embeddings, embeddings)
288
  print(similarities)
289
+ # tensor([[1.0000, 0.6585, 0.1068],
290
+ # [0.6585, 1.0000, 0.1405],
291
+ # [0.1068, 0.1405, 1.0000]])
292
  ```
293
 
294
  <!--
 
1264
  | 0.1290 | 7300 | 0.4121 |
1265
  | 0.1299 | 7350 | 0.4139 |
1266
  | 0.1308 | 7400 | 0.4311 |
1267
+ | 0.1316 | 7450 | 0.4025 |
1268
+ | 0.1325 | 7500 | 0.4791 |
1269
+ | 0.1334 | 7550 | 0.4498 |
1270
+ | 0.1343 | 7600 | 0.4538 |
1271
 
1272
 
1273
  ### Framework Versions
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7640a8c5c08cd84ea9d34e9a392788849c161e51fab1fb1e24cf029e4bd1e02b
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fd4bdcdcbc94340067a5db9757cb8dc5e18160f6e0052a5271f3a3014faaad5b
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d8bba72a7f616d924ad3ea248b2f6cbefe36b03a9a05b0265d1aae461c6b1d0f
3
  size 180609611
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d1614719d6dd7c8ee90660bde3185c3bc7b3a45d06a5325bcddbb32753674ab3
3
  size 180609611
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:234f75280c102551c5f624e1ddf7b22e58abe72b0541e05f85525df9445290c6
3
  size 14645
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:09557c453e6a16e29d297517245393e31d8c1c2292c9705909c930c0a8bcca5a
3
  size 14645
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d4c7f383c5c3caed78012349896a057bf1feaccde880a982830ace58530daa75
3
  size 1383
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:405bd92270a66c48608fa1efe67da0e3e668cf968c7d25ea748071fc5b6c3d6a
3
  size 1383
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:86c610364818334e39ecc9c71264546e8b8d4a41c51d290cd21e1ca096739e20
3
  size 1465
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:23842e055dc64db6d0feb0d9e09209b01e916046b58ef6d199cb81b51ea994ff
3
  size 1465
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.13076284214804473,
6
  "eval_steps": 500,
7
- "global_step": 7400,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -1044,6 +1044,34 @@
1044
  "learning_rate": 4.82927882821857e-05,
1045
  "loss": 0.4311,
1046
  "step": 7400
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1047
  }
1048
  ],
1049
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.13429697301691082,
6
  "eval_steps": 500,
7
+ "global_step": 7600,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
1044
  "learning_rate": 4.82927882821857e-05,
1045
  "loss": 0.4311,
1046
  "step": 7400
1047
+ },
1048
+ {
1049
+ "epoch": 0.13164637486526126,
1050
+ "grad_norm": 2.3639650344848633,
1051
+ "learning_rate": 4.824370226384717e-05,
1052
+ "loss": 0.4025,
1053
+ "step": 7450
1054
+ },
1055
+ {
1056
+ "epoch": 0.1325299075824778,
1057
+ "grad_norm": 3.4997270107269287,
1058
+ "learning_rate": 4.8194616245508635e-05,
1059
+ "loss": 0.4791,
1060
+ "step": 7500
1061
+ },
1062
+ {
1063
+ "epoch": 0.1334134402996943,
1064
+ "grad_norm": 1.644084095954895,
1065
+ "learning_rate": 4.814553022717009e-05,
1066
+ "loss": 0.4498,
1067
+ "step": 7550
1068
+ },
1069
+ {
1070
+ "epoch": 0.13429697301691082,
1071
+ "grad_norm": 1.8292336463928223,
1072
+ "learning_rate": 4.809644420883156e-05,
1073
+ "loss": 0.4538,
1074
+ "step": 7600
1075
  }
1076
  ],
1077
  "logging_steps": 50,