guyhadad01 committed on
Commit
5f9d28c
·
verified ·
1 Parent(s): 139465d

Training in progress, step 1000, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -286,9 +286,9 @@ print(embeddings.shape)
286
  # Get the similarity scores for the embeddings
287
  similarities = model.similarity(embeddings, embeddings)
288
  print(similarities)
289
- # tensor([[1.0000, 0.5922, 0.0910],
290
- # [0.5922, 1.0000, 0.1485],
291
- # [0.0910, 0.1485, 1.0000]])
292
  ```
293
 
294
  <!--
@@ -1240,6 +1240,10 @@ You can finetune this model on your own dataset.
1240
  | 0.0124 | 700 | 0.7701 |
1241
  | 0.0133 | 750 | 0.7525 |
1242
  | 0.0141 | 800 | 0.7097 |
 
 
 
 
1243
 
1244
 
1245
  ### Framework Versions
 
286
  # Get the similarity scores for the embeddings
287
  similarities = model.similarity(embeddings, embeddings)
288
  print(similarities)
289
+ # tensor([[1.0000, 0.5961, 0.1032],
290
+ # [0.5961, 1.0000, 0.1553],
291
+ # [0.1032, 0.1553, 1.0000]])
292
  ```
293
 
294
  <!--
 
1240
  | 0.0124 | 700 | 0.7701 |
1241
  | 0.0133 | 750 | 0.7525 |
1242
  | 0.0141 | 800 | 0.7097 |
1243
+ | 0.0150 | 850 | 0.7575 |
1244
+ | 0.0159 | 900 | 0.6899 |
1245
+ | 0.0168 | 950 | 0.6655 |
1246
+ | 0.0177 | 1000 | 0.6601 |
1247
 
1248
 
1249
  ### Framework Versions
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4edf45758f8655b39949040bb376942e3eaf9cabfbd997bdd27d281a59e48fd7
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:897e48ca4a1b0c79cf2429b6ef4ca73b309f3c5bcc06ba0c170b921c50590ea0
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b860245e653a414010bafe2c3c8174c59f95411463e02d1f20aed248e44dc779
3
  size 180609611
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4b5b75bdfd9f13b9fd5af71157d29fb1f2150a495f511bd4c3ae1ede089c6f6e
3
  size 180609611
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6604fa50a947bb7a8c4e40ff3e2a5641ad506d5aa6a161b0cd0a5fa0c1d78ee8
3
  size 14645
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:435c96c122df13db75824be5f8aff8593c48e01c0d3f8f0275499435e34f1b52
3
  size 14645
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6fef122931c86c2d2736773be787da21ac6460d41580735381e953556fb410be
3
  size 1383
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:14ae2a2128444abab378aa06c09a61a84665f758fcc19fc46f5789b0bc1b5665
3
  size 1383
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8ec1539c27d7283f1e5aca2a0dde35cb977a77f34c850320b82d506a15f4bbbb
3
  size 1465
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dfb73f8c20bf0b1f8fb2141f8979207ef099f052597bee612ca21a5ed63b4554
3
  size 1465
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.014136523475464296,
6
  "eval_steps": 500,
7
- "global_step": 800,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -120,6 +120,34 @@
120
  "learning_rate": 7.058303886925795e-06,
121
  "loss": 0.7097,
122
  "step": 800
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
123
  }
124
  ],
125
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.01767065434433037,
6
  "eval_steps": 500,
7
+ "global_step": 1000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
120
  "learning_rate": 7.058303886925795e-06,
121
  "loss": 0.7097,
122
  "step": 800
123
+ },
124
+ {
125
+ "epoch": 0.015020056192680814,
126
+ "grad_norm": 3.297929286956787,
127
+ "learning_rate": 7.5e-06,
128
+ "loss": 0.7575,
129
+ "step": 850
130
+ },
131
+ {
132
+ "epoch": 0.015903588909897334,
133
+ "grad_norm": 4.028406143188477,
134
+ "learning_rate": 7.941696113074205e-06,
135
+ "loss": 0.6899,
136
+ "step": 900
137
+ },
138
+ {
139
+ "epoch": 0.016787121627113853,
140
+ "grad_norm": 2.2513041496276855,
141
+ "learning_rate": 8.38339222614841e-06,
142
+ "loss": 0.6655,
143
+ "step": 950
144
+ },
145
+ {
146
+ "epoch": 0.01767065434433037,
147
+ "grad_norm": 2.402355670928955,
148
+ "learning_rate": 8.825088339222614e-06,
149
+ "loss": 0.6601,
150
+ "step": 1000
151
  }
152
  ],
153
  "logging_steps": 50,