guyhadad01 committed on
Commit
99db132
·
verified ·
1 Parent(s): de5c955

Training in progress, step 3200, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -286,9 +286,9 @@ print(embeddings.shape)
286
  # Get the similarity scores for the embeddings
287
  similarities = model.similarity(embeddings, embeddings)
288
  print(similarities)
289
- # tensor([[1.0000, 0.5851, 0.1104],
290
- # [0.5851, 1.0000, 0.1499],
291
- # [0.1104, 0.1499, 1.0000]])
292
  ```
293
 
294
  <!--
@@ -1284,6 +1284,10 @@ You can finetune this model on your own dataset.
1284
  | 0.0512 | 2900 | 0.545 |
1285
  | 0.0521 | 2950 | 0.5299 |
1286
  | 0.0530 | 3000 | 0.5186 |
 
 
 
 
1287
 
1288
 
1289
  ### Framework Versions
 
286
  # Get the similarity scores for the embeddings
287
  similarities = model.similarity(embeddings, embeddings)
288
  print(similarities)
289
+ # tensor([[1.0000, 0.6239, 0.0843],
290
+ # [0.6239, 1.0000, 0.1270],
291
+ # [0.0843, 0.1270, 1.0000]])
292
  ```
293
 
294
  <!--
 
1284
  | 0.0512 | 2900 | 0.545 |
1285
  | 0.0521 | 2950 | 0.5299 |
1286
  | 0.0530 | 3000 | 0.5186 |
1287
+ | 0.0539 | 3050 | 0.5259 |
1288
+ | 0.0548 | 3100 | 0.6663 |
1289
+ | 0.0557 | 3150 | 0.5152 |
1290
+ | 0.0565 | 3200 | 0.5417 |
1291
 
1292
 
1293
  ### Framework Versions
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:59bbbce60ef16e762bba9f8a3d9a23a215afa3ee462d98aeaeff69de27f89341
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0d2f7da0d95d2430f6d13687995e080c3fed754535ee0392c4ac0d988595c206
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6b5d645070344294324c8e72697f2c1b516db72cb3276a26e4ef639ee18da667
3
  size 180609611
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:512331db4e7bbde846026f7146ee83d4cd409399e1029e49f0bdd154597bf767
3
  size 180609611
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2e56f09343792c3d21faf51137b042a641d6fa07972ad9c4af87d2751a155e0e
3
  size 14645
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e09a17a8985bbbf88900bb9c55cd9603d6be0205a4acbc9e556c560a96f36436
3
  size 14645
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5ac1c46a2776d12775d23d0f587efc112188137ce2140da35bc15d301c9f620e
3
  size 1383
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c180209d079915ff6b1a53d381fcf729d9a0c187b6ef7700d80eb57e51fa070b
3
  size 1383
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:301ffba56ec75fdb730415687e7a885bf8c0dc112cbdcb4314fb3614afb6e000
3
  size 1465
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:473270958e9e1e76d015dca5bcc9949e4f7aea727004c8a1e7514a0b959338f7
3
  size 1465
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.05301196303299111,
6
  "eval_steps": 500,
7
- "global_step": 3000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -428,6 +428,34 @@
428
  "learning_rate": 2.649293286219081e-05,
429
  "loss": 0.5186,
430
  "step": 3000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
431
  }
432
  ],
433
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.056546093901857185,
6
  "eval_steps": 500,
7
+ "global_step": 3200,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
428
  "learning_rate": 2.649293286219081e-05,
429
  "loss": 0.5186,
430
  "step": 3000
431
+ },
432
+ {
433
+ "epoch": 0.05389549575020763,
434
+ "grad_norm": 1.842517375946045,
435
+ "learning_rate": 2.693462897526502e-05,
436
+ "loss": 0.5259,
437
+ "step": 3050
438
+ },
439
+ {
440
+ "epoch": 0.05477902846742415,
441
+ "grad_norm": 3.319514274597168,
442
+ "learning_rate": 2.7376325088339223e-05,
443
+ "loss": 0.6663,
444
+ "step": 3100
445
+ },
446
+ {
447
+ "epoch": 0.05566256118464067,
448
+ "grad_norm": 2.7143654823303223,
449
+ "learning_rate": 2.781802120141343e-05,
450
+ "loss": 0.5152,
451
+ "step": 3150
452
+ },
453
+ {
454
+ "epoch": 0.056546093901857185,
455
+ "grad_norm": 2.8187732696533203,
456
+ "learning_rate": 2.8259717314487632e-05,
457
+ "loss": 0.5417,
458
+ "step": 3200
459
  }
460
  ],
461
  "logging_steps": 50,