yalhessi committed on
Commit
5692f91
·
verified ·
1 Parent(s): 45fc7c8

End of training

Browse files
README.md CHANGED
@@ -43,11 +43,14 @@ The following hyperparameters were used during training:
43
  - total_eval_batch_size: 8
44
  - optimizer: Use OptimizerNames.ADAMW_TORCH with betas=(0.9,0.999) and epsilon=1e-08 and optimizer_args=No additional optimizer arguments
45
  - lr_scheduler_type: linear
46
- - training_steps: 10
47
  - mixed_precision_training: Native AMP
48
 
49
  ### Training results
50
 
 
 
 
51
 
52
 
53
  ### Framework versions
 
43
  - total_eval_batch_size: 8
44
  - optimizer: Use OptimizerNames.ADAMW_TORCH with betas=(0.9,0.999) and epsilon=1e-08 and optimizer_args=No additional optimizer arguments
45
  - lr_scheduler_type: linear
46
+ - training_steps: 100
47
  - mixed_precision_training: Native AMP
48
 
49
  ### Training results
50
 
51
+ | Training Loss | Epoch | Step | Validation Loss |
52
+ |:-------------:|:------:|:----:|:---------------:|
53
+ | No log | 0.0159 | 100 | 0.5223 |
54
 
55
 
56
  ### Framework versions
adapter_config.json CHANGED
@@ -23,8 +23,8 @@
23
  "rank_pattern": {},
24
  "revision": null,
25
  "target_modules": [
26
- "v_proj",
27
- "q_proj"
28
  ],
29
  "task_type": "CAUSAL_LM",
30
  "use_dora": false,
 
23
  "rank_pattern": {},
24
  "revision": null,
25
  "target_modules": [
26
+ "q_proj",
27
+ "v_proj"
28
  ],
29
  "task_type": "CAUSAL_LM",
30
  "use_dora": false,
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:554f3c73a6d1540f19169ad48d20d648065c40b0998aaa1c2e8fe6e91d25e98b
3
  size 6304096
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e6773d22d06c3573c8757eb20a87babba791dfb6264b4238f861cd5a1ece6fa5
3
  size 6304096
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f574f3944025b1ebe89b204e5a9a117a7a06c2c01ff12ec2bd53ab1ed25cb1cc
3
  size 5432
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2b7db89eec48161a0794f002b65667c918fb3936a11e22c0211de5430bc3a8e7
3
  size 5432