guyhadad01 committed on
Commit
352252b
·
verified ·
1 Parent(s): c6ca203

Training in progress, step 1200, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -286,9 +286,9 @@ print(embeddings.shape)
286
  # Get the similarity scores for the embeddings
287
  similarities = model.similarity(embeddings, embeddings)
288
  print(similarities)
289
- # tensor([[1.0000, 0.5961, 0.1032],
290
- # [0.5961, 1.0000, 0.1553],
291
- # [0.1032, 0.1553, 1.0000]])
292
  ```
293
 
294
  <!--
@@ -1244,6 +1244,10 @@ You can finetune this model on your own dataset.
1244
  | 0.0159 | 900 | 0.6899 |
1245
  | 0.0168 | 950 | 0.6655 |
1246
  | 0.0177 | 1000 | 0.6601 |
 
 
 
 
1247
 
1248
 
1249
  ### Framework Versions
 
286
  # Get the similarity scores for the embeddings
287
  similarities = model.similarity(embeddings, embeddings)
288
  print(similarities)
289
+ # tensor([[1.0000, 0.6149, 0.1330],
290
+ # [0.6149, 1.0000, 0.1618],
291
+ # [0.1330, 0.1618, 1.0000]])
292
  ```
293
 
294
  <!--
 
1244
  | 0.0159 | 900 | 0.6899 |
1245
  | 0.0168 | 950 | 0.6655 |
1246
  | 0.0177 | 1000 | 0.6601 |
1247
+ | 0.0186 | 1050 | 0.6925 |
1248
+ | 0.0194 | 1100 | 0.6169 |
1249
+ | 0.0203 | 1150 | 0.6367 |
1250
+ | 0.0212 | 1200 | 0.615 |
1251
 
1252
 
1253
  ### Framework Versions
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:897e48ca4a1b0c79cf2429b6ef4ca73b309f3c5bcc06ba0c170b921c50590ea0
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a9a3361ca69436d4dea95cdcd29cea53aad0e253053cdc5876ca978a2c32a909
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4b5b75bdfd9f13b9fd5af71157d29fb1f2150a495f511bd4c3ae1ede089c6f6e
3
  size 180609611
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7762e45714247d845b98566f70065d2e826d2dad86f6f5a0df3a0f6e4cc3e852
3
  size 180609611
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:435c96c122df13db75824be5f8aff8593c48e01c0d3f8f0275499435e34f1b52
3
  size 14645
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:92073e2121fa1a50d2393b4b193256ae067f8269c786bb12674760941abf850b
3
  size 14645
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:14ae2a2128444abab378aa06c09a61a84665f758fcc19fc46f5789b0bc1b5665
3
  size 1383
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:18783150ac09b6b81cea5af47876a10bfe5f36c3d76aca4ffce5382bdfaf7b28
3
  size 1383
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dfb73f8c20bf0b1f8fb2141f8979207ef099f052597bee612ca21a5ed63b4554
3
  size 1465
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8ed3eff7033631ee9ecca3bfddfbb19428dfe42f7f70d962500698dee83c17e2
3
  size 1465
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.01767065434433037,
6
  "eval_steps": 500,
7
- "global_step": 1000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -148,6 +148,34 @@
148
  "learning_rate": 8.825088339222614e-06,
149
  "loss": 0.6601,
150
  "step": 1000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
151
  }
152
  ],
153
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.021204785213196443,
6
  "eval_steps": 500,
7
+ "global_step": 1200,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
148
  "learning_rate": 8.825088339222614e-06,
149
  "loss": 0.6601,
150
  "step": 1000
151
+ },
152
+ {
153
+ "epoch": 0.01855418706154689,
154
+ "grad_norm": 4.492621898651123,
155
+ "learning_rate": 9.26678445229682e-06,
156
+ "loss": 0.6925,
157
+ "step": 1050
158
+ },
159
+ {
160
+ "epoch": 0.019437719778763407,
161
+ "grad_norm": 3.8099517822265625,
162
+ "learning_rate": 9.708480565371025e-06,
163
+ "loss": 0.6169,
164
+ "step": 1100
165
+ },
166
+ {
167
+ "epoch": 0.020321252495979925,
168
+ "grad_norm": 4.58193826675415,
169
+ "learning_rate": 1.0150176678445231e-05,
170
+ "loss": 0.6367,
171
+ "step": 1150
172
+ },
173
+ {
174
+ "epoch": 0.021204785213196443,
175
+ "grad_norm": 4.745123863220215,
176
+ "learning_rate": 1.0591872791519434e-05,
177
+ "loss": 0.615,
178
+ "step": 1200
179
  }
180
  ],
181
  "logging_steps": 50,