Pelmeshek committed on
Commit
8eb1e83
·
verified ·
1 Parent(s): 888e249

Pelmeshek/qwen3-0.6B-function-calling-lora

Browse files
README.md CHANGED
@@ -36,9 +36,9 @@ This model was trained with SFT.
36
 
37
  - TRL: 0.17.0
38
  - Transformers: 4.51.3
39
- - Pytorch: 2.6.0+cu124
40
  - Datasets: 3.5.1
41
- - Tokenizers: 0.21.1
42
 
43
  ## Citations
44
 
 
36
 
37
  - TRL: 0.17.0
38
  - Transformers: 4.51.3
39
+ - Pytorch: 2.5.1
40
  - Datasets: 3.5.1
41
+ - Tokenizers: 0.21.0
42
 
43
  ## Citations
44
 
adapter_config.json CHANGED
@@ -24,15 +24,15 @@
24
  "rank_pattern": {},
25
  "revision": null,
26
  "target_modules": [
27
- "down_proj",
28
- "lm_head",
29
- "k_proj",
30
  "embed_tokens",
31
  "gate_proj",
32
- "o_proj",
33
  "q_proj",
 
 
 
34
  "v_proj",
35
- "up_proj"
36
  ],
37
  "task_type": "CAUSAL_LM",
38
  "trainable_token_indices": null,
 
24
  "rank_pattern": {},
25
  "revision": null,
26
  "target_modules": [
 
 
 
27
  "embed_tokens",
28
  "gate_proj",
29
+ "up_proj",
30
  "q_proj",
31
+ "lm_head",
32
+ "o_proj",
33
+ "k_proj",
34
  "v_proj",
35
+ "down_proj"
36
  ],
37
  "task_type": "CAUSAL_LM",
38
  "trainable_token_indices": null,
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b2ab1ffc3096ef34be9b1fe98e3ead14c09d1ea1a87861ad82cb60d44da86df6
3
- size 681212472
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c937aa9b05f0856a06ae85c2506481ae54b788eecbcde20b9805ee1b499b00ff
3
+ size 681204024
added_tokens.json CHANGED
@@ -2,11 +2,9 @@
2
  "</think>": 151668,
3
  "</tool_call>": 151658,
4
  "</tool_response>": 151666,
5
- "</tools>": 151670,
6
  "<think>": 151667,
7
  "<tool_call>": 151657,
8
  "<tool_response>": 151665,
9
- "<tools>": 151669,
10
  "<|box_end|>": 151649,
11
  "<|box_start|>": 151648,
12
  "<|endoftext|>": 151643,
 
2
  "</think>": 151668,
3
  "</tool_call>": 151658,
4
  "</tool_response>": 151666,
 
5
  "<think>": 151667,
6
  "<tool_call>": 151657,
7
  "<tool_response>": 151665,
 
8
  "<|box_end|>": 151649,
9
  "<|box_start|>": 151648,
10
  "<|endoftext|>": 151643,
runs/May02_12-45-08_Nikitas-MacBook-Pro.local/events.out.tfevents.1746179143.Nikitas-MacBook-Pro.local ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5fd7c2923438ff2d9fb5384d4f625ec19723483cb6e8c7c48155962e80f05811
3
+ size 6181
runs/May02_12-51-51_Nikitas-MacBook-Pro.local/events.out.tfevents.1746179542.Nikitas-MacBook-Pro.local ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:74bd6bd101a816027a7f543c61de1025e630715ac407e0b3aa679426eecc70b7
3
+ size 77252
special_tokens_map.json CHANGED
@@ -1,61 +1,18 @@
1
  {
2
  "additional_special_tokens": [
3
- {
4
- "content": "<tools>",
5
- "lstrip": false,
6
- "normalized": false,
7
- "rstrip": false,
8
- "single_word": false
9
- },
10
- {
11
- "content": "</tools>",
12
- "lstrip": false,
13
- "normalized": false,
14
- "rstrip": false,
15
- "single_word": false
16
- },
17
- {
18
- "content": "<think>",
19
- "lstrip": false,
20
- "normalized": false,
21
- "rstrip": false,
22
- "single_word": false
23
- },
24
- {
25
- "content": "</think>",
26
- "lstrip": false,
27
- "normalized": false,
28
- "rstrip": false,
29
- "single_word": false
30
- },
31
- {
32
- "content": "<tool_call>",
33
- "lstrip": false,
34
- "normalized": false,
35
- "rstrip": false,
36
- "single_word": false
37
- },
38
- {
39
- "content": "</tool_call>",
40
- "lstrip": false,
41
- "normalized": false,
42
- "rstrip": false,
43
- "single_word": false
44
- },
45
- {
46
- "content": "<tool_response>",
47
- "lstrip": false,
48
- "normalized": false,
49
- "rstrip": false,
50
- "single_word": false
51
- },
52
- {
53
- "content": "</tool_response>",
54
- "lstrip": false,
55
- "normalized": false,
56
- "rstrip": false,
57
- "single_word": false
58
- }
59
  ],
60
  "eos_token": {
61
  "content": "<|im_end|>",
 
1
  {
2
  "additional_special_tokens": [
3
+ "<|im_start|>",
4
+ "<|im_end|>",
5
+ "<|object_ref_start|>",
6
+ "<|object_ref_end|>",
7
+ "<|box_start|>",
8
+ "<|box_end|>",
9
+ "<|quad_start|>",
10
+ "<|quad_end|>",
11
+ "<|vision_start|>",
12
+ "<|vision_end|>",
13
+ "<|vision_pad|>",
14
+ "<|image_pad|>",
15
+ "<|video_pad|>"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
16
  ],
17
  "eos_token": {
18
  "content": "<|im_end|>",
tokenizer.json CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:529f547f99f91cef0a10b47f12b253231c666833e2b8eb22493a956853de322d
3
- size 11423017
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aeb13307a71acd8fe81861d94ad54ab689df773318809eed3cbe794b4492dae4
3
+ size 11422654
tokenizer_config.json CHANGED
@@ -120,7 +120,7 @@
120
  "normalized": false,
121
  "rstrip": false,
122
  "single_word": false,
123
- "special": true
124
  },
125
  "151658": {
126
  "content": "</tool_call>",
@@ -128,7 +128,7 @@
128
  "normalized": false,
129
  "rstrip": false,
130
  "single_word": false,
131
- "special": true
132
  },
133
  "151659": {
134
  "content": "<|fim_prefix|>",
@@ -184,7 +184,7 @@
184
  "normalized": false,
185
  "rstrip": false,
186
  "single_word": false,
187
- "special": true
188
  },
189
  "151666": {
190
  "content": "</tool_response>",
@@ -192,7 +192,7 @@
192
  "normalized": false,
193
  "rstrip": false,
194
  "single_word": false,
195
- "special": true
196
  },
197
  "151667": {
198
  "content": "<think>",
@@ -200,7 +200,7 @@
200
  "normalized": false,
201
  "rstrip": false,
202
  "single_word": false,
203
- "special": true
204
  },
205
  "151668": {
206
  "content": "</think>",
@@ -208,34 +208,23 @@
208
  "normalized": false,
209
  "rstrip": false,
210
  "single_word": false,
211
- "special": true
212
- },
213
- "151669": {
214
- "content": "<tools>",
215
- "lstrip": false,
216
- "normalized": false,
217
- "rstrip": false,
218
- "single_word": false,
219
- "special": true
220
- },
221
- "151670": {
222
- "content": "</tools>",
223
- "lstrip": false,
224
- "normalized": false,
225
- "rstrip": false,
226
- "single_word": false,
227
- "special": true
228
  }
229
  },
230
  "additional_special_tokens": [
231
- "<tools>",
232
- "</tools>",
233
- "<think>",
234
- "</think>",
235
- "<tool_call>",
236
- "</tool_call>",
237
- "<tool_response>",
238
- "</tool_response>"
 
 
 
 
 
239
  ],
240
  "bos_token": null,
241
  "chat_template": "{{ bos_token }}{% for message in messages %}{{ '<start_of_turn>' + message['role'] + '\\n' + message['content'] | trim + '<end_of_turn><eos>\\n' }}{% endfor %}{% if add_generation_prompt %}{{'<start_of_turn>model\\n'}}{% endif %}",
 
120
  "normalized": false,
121
  "rstrip": false,
122
  "single_word": false,
123
+ "special": false
124
  },
125
  "151658": {
126
  "content": "</tool_call>",
 
128
  "normalized": false,
129
  "rstrip": false,
130
  "single_word": false,
131
+ "special": false
132
  },
133
  "151659": {
134
  "content": "<|fim_prefix|>",
 
184
  "normalized": false,
185
  "rstrip": false,
186
  "single_word": false,
187
+ "special": false
188
  },
189
  "151666": {
190
  "content": "</tool_response>",
 
192
  "normalized": false,
193
  "rstrip": false,
194
  "single_word": false,
195
+ "special": false
196
  },
197
  "151667": {
198
  "content": "<think>",
 
200
  "normalized": false,
201
  "rstrip": false,
202
  "single_word": false,
203
+ "special": false
204
  },
205
  "151668": {
206
  "content": "</think>",
 
208
  "normalized": false,
209
  "rstrip": false,
210
  "single_word": false,
211
+ "special": false
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
212
  }
213
  },
214
  "additional_special_tokens": [
215
+ "<|im_start|>",
216
+ "<|im_end|>",
217
+ "<|object_ref_start|>",
218
+ "<|object_ref_end|>",
219
+ "<|box_start|>",
220
+ "<|box_end|>",
221
+ "<|quad_start|>",
222
+ "<|quad_end|>",
223
+ "<|vision_start|>",
224
+ "<|vision_end|>",
225
+ "<|vision_pad|>",
226
+ "<|image_pad|>",
227
+ "<|video_pad|>"
228
  ],
229
  "bos_token": null,
230
  "chat_template": "{{ bos_token }}{% for message in messages %}{{ '<start_of_turn>' + message['role'] + '\\n' + message['content'] | trim + '<end_of_turn><eos>\\n' }}{% endfor %}{% if add_generation_prompt %}{{'<start_of_turn>model\\n'}}{% endif %}",
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:33dbbb8d1b1f00d6101780837a648e781e7ca05891ada8e7dfb493cf879685c2
3
  size 5688
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eb9bd71b71cb780f4e84e9fbb44e8e6a279ee4d67b68ccc1616f62848f870ec2
3
  size 5688