Training in progress, step 3
Browse files- adapter_config.json +1 -1
- adapter_model.safetensors +1 -1
- chat_template.jinja +61 -26
- training_args.bin +2 -2
adapter_config.json
CHANGED
@@ -26,8 +26,8 @@
|
|
26 |
"revision": null,
|
27 |
"target_modules": [
|
28 |
"q_proj",
|
29 |
-
"o_proj",
|
30 |
"v_proj",
|
|
|
31 |
"k_proj"
|
32 |
],
|
33 |
"target_parameters": null,
|
|
|
26 |
"revision": null,
|
27 |
"target_modules": [
|
28 |
"q_proj",
|
|
|
29 |
"v_proj",
|
30 |
+
"o_proj",
|
31 |
"k_proj"
|
32 |
],
|
33 |
"target_parameters": null,
|
adapter_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 101748240
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:633baa6615812857a5c1a995933ff86fa3d7dced1bf0bc0d0213e5afbc48286f
|
3 |
size 101748240
|
chat_template.jinja
CHANGED
@@ -1,48 +1,80 @@
|
|
1 |
{%- if tools %}
|
2 |
{{- '<|im_start|>system\n' }}
|
3 |
-
{%- if messages[0]
|
4 |
-
{{- messages[0]
|
5 |
-
{%- else %}
|
6 |
-
{{- 'You are Open-R1, a language model trained by Hugging Face to help users. Your role as an assistant involves thoroughly exploring questions through a systematic thinking process before providing the final precise and accurate solutions. This requires engaging in a comprehensive cycle of analysis, summarizing, exploration, reassessment, reflection, backtracing, and iteration to develop well-considered thinking process. Please structure your response into two main sections: Thought and Solution using the specified format: <think> Thought section </think> Solution section. In the Thought section, detail your reasoning process in steps. Each step should include detailed considerations such as analysing questions, summarizing relevant findings, brainstorming new ideas, verifying the accuracy of the current steps, refining any errors, and revisiting previous steps. In the Solution section, based on various attempts, explorations, and reflections from the Thought section, systematically present the final solution that you deem correct. The Solution section should be logical, accurate, and concise and detail necessary steps needed to reach the conclusion. Now, try to solve the following question through the above guidelines.' }}
|
7 |
{%- endif %}
|
8 |
-
{{- "
|
9 |
{%- for tool in tools %}
|
10 |
{{- "\n" }}
|
11 |
{{- tool | tojson }}
|
12 |
{%- endfor %}
|
13 |
{{- "\n</tools>\n\nFor each function call, return a json object with function name and arguments within <tool_call></tool_call> XML tags:\n<tool_call>\n{\"name\": <function-name>, \"arguments\": <args-json-object>}\n</tool_call><|im_end|>\n" }}
|
14 |
{%- else %}
|
15 |
-
{%- if messages[0]
|
16 |
-
{{- '<|im_start|>system\n' + messages[0]
|
17 |
-
{%- else %}
|
18 |
-
{{- '<|im_start|>system\nYou are Open-R1, a language model trained by Hugging Face to help users. Your role as an assistant involves thoroughly exploring questions through a systematic thinking process before providing the final precise and accurate solutions. This requires engaging in a comprehensive cycle of analysis, summarizing, exploration, reassessment, reflection, backtracing, and iteration to develop well-considered thinking process. Please structure your response into two main sections: Thought and Solution using the specified format: <think> Thought section </think> Solution section. In the Thought section, detail your reasoning process in steps. Each step should include detailed considerations such as analysing questions, summarizing relevant findings, brainstorming new ideas, verifying the accuracy of the current steps, refining any errors, and revisiting previous steps. In the Solution section, based on various attempts, explorations, and reflections from the Thought section, systematically present the final solution that you deem correct. The Solution section should be logical, accurate, and concise and detail necessary steps needed to reach the conclusion. Now, try to solve the following question through the above guidelines.<|im_end|>\n' }}
|
19 |
{%- endif %}
|
20 |
{%- endif %}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
21 |
{%- for message in messages %}
|
22 |
-
{%- if
|
23 |
-
{
|
|
|
|
|
|
|
|
|
|
|
24 |
{%- elif message.role == "assistant" %}
|
25 |
-
{
|
26 |
-
{%- if message.
|
27 |
-
{
|
|
|
|
|
|
|
|
|
|
|
28 |
{%- endif %}
|
29 |
-
{%-
|
30 |
-
{%- if
|
31 |
-
{
|
|
|
|
|
32 |
{%- endif %}
|
33 |
-
|
34 |
-
{{-
|
35 |
-
|
36 |
-
|
37 |
-
{
|
38 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
39 |
{{- '<|im_end|>\n' }}
|
40 |
{%- elif message.role == "tool" %}
|
41 |
-
{%- if
|
42 |
{{- '<|im_start|>user' }}
|
43 |
{%- endif %}
|
44 |
{{- '\n<tool_response>\n' }}
|
45 |
-
{{-
|
46 |
{{- '\n</tool_response>' }}
|
47 |
{%- if loop.last or (messages[loop.index0 + 1].role != "tool") %}
|
48 |
{{- '<|im_end|>\n' }}
|
@@ -51,4 +83,7 @@
|
|
51 |
{%- endfor %}
|
52 |
{%- if add_generation_prompt %}
|
53 |
{{- '<|im_start|>assistant\n' }}
|
54 |
-
{%-
|
|
|
|
|
|
|
|
1 |
{%- if tools %}
|
2 |
{{- '<|im_start|>system\n' }}
|
3 |
+
{%- if messages[0].role == 'system' %}
|
4 |
+
{{- messages[0].content + '\n\n' }}
|
|
|
|
|
5 |
{%- endif %}
|
6 |
+
{{- "# Tools\n\nYou may call one or more functions to assist with the user query.\n\nYou are provided with function signatures within <tools></tools> XML tags:\n<tools>" }}
|
7 |
{%- for tool in tools %}
|
8 |
{{- "\n" }}
|
9 |
{{- tool | tojson }}
|
10 |
{%- endfor %}
|
11 |
{{- "\n</tools>\n\nFor each function call, return a json object with function name and arguments within <tool_call></tool_call> XML tags:\n<tool_call>\n{\"name\": <function-name>, \"arguments\": <args-json-object>}\n</tool_call><|im_end|>\n" }}
|
12 |
{%- else %}
|
13 |
+
{%- if messages[0].role == 'system' %}
|
14 |
+
{{- '<|im_start|>system\n' + messages[0].content + '<|im_end|>\n' }}
|
|
|
|
|
15 |
{%- endif %}
|
16 |
{%- endif %}
|
17 |
+
{%- set ns = namespace(multi_step_tool=true, last_query_index=messages|length - 1) %}
|
18 |
+
{%- for message in messages[::-1] %}
|
19 |
+
{%- set index = (messages|length - 1) - loop.index0 %}
|
20 |
+
{%- if ns.multi_step_tool and message.role == "user" and message.content is string and not(message.content.startswith('<tool_response>') and message.content.endswith('</tool_response>')) %}
|
21 |
+
{%- set ns.multi_step_tool = false %}
|
22 |
+
{%- set ns.last_query_index = index %}
|
23 |
+
{%- endif %}
|
24 |
+
{%- endfor %}
|
25 |
{%- for message in messages %}
|
26 |
+
{%- if message.content is string %}
|
27 |
+
{%- set content = message.content %}
|
28 |
+
{%- else %}
|
29 |
+
{%- set content = '' %}
|
30 |
+
{%- endif %}
|
31 |
+
{%- if (message.role == "user") or (message.role == "system" and not loop.first) %}
|
32 |
+
{{- '<|im_start|>' + message.role + '\n' + content + '<|im_end|>' + '\n' }}
|
33 |
{%- elif message.role == "assistant" %}
|
34 |
+
{%- set reasoning_content = '' %}
|
35 |
+
{%- if message.reasoning_content is string %}
|
36 |
+
{%- set reasoning_content = message.reasoning_content %}
|
37 |
+
{%- else %}
|
38 |
+
{%- if '</think>' in content %}
|
39 |
+
{%- set reasoning_content = content.split('</think>')[0].rstrip('\n').split('<think>')[-1].lstrip('\n') %}
|
40 |
+
{%- set content = content.split('</think>')[-1].lstrip('\n') %}
|
41 |
+
{%- endif %}
|
42 |
{%- endif %}
|
43 |
+
{%- if loop.index0 > ns.last_query_index %}
|
44 |
+
{%- if loop.last or (not loop.last and reasoning_content) %}
|
45 |
+
{{- '<|im_start|>' + message.role + '\n<think>\n' + reasoning_content.strip('\n') + '\n</think>\n\n' + content.lstrip('\n') }}
|
46 |
+
{%- else %}
|
47 |
+
{{- '<|im_start|>' + message.role + '\n' + content }}
|
48 |
{%- endif %}
|
49 |
+
{%- else %}
|
50 |
+
{{- '<|im_start|>' + message.role + '\n' + content }}
|
51 |
+
{%- endif %}
|
52 |
+
{%- if message.tool_calls %}
|
53 |
+
{%- for tool_call in message.tool_calls %}
|
54 |
+
{%- if (loop.first and content) or (not loop.first) %}
|
55 |
+
{{- '\n' }}
|
56 |
+
{%- endif %}
|
57 |
+
{%- if tool_call.function %}
|
58 |
+
{%- set tool_call = tool_call.function %}
|
59 |
+
{%- endif %}
|
60 |
+
{{- '<tool_call>\n{"name": "' }}
|
61 |
+
{{- tool_call.name }}
|
62 |
+
{{- '", "arguments": ' }}
|
63 |
+
{%- if tool_call.arguments is string %}
|
64 |
+
{{- tool_call.arguments }}
|
65 |
+
{%- else %}
|
66 |
+
{{- tool_call.arguments | tojson }}
|
67 |
+
{%- endif %}
|
68 |
+
{{- '}\n</tool_call>' }}
|
69 |
+
{%- endfor %}
|
70 |
+
{%- endif %}
|
71 |
{{- '<|im_end|>\n' }}
|
72 |
{%- elif message.role == "tool" %}
|
73 |
+
{%- if loop.first or (messages[loop.index0 - 1].role != "tool") %}
|
74 |
{{- '<|im_start|>user' }}
|
75 |
{%- endif %}
|
76 |
{{- '\n<tool_response>\n' }}
|
77 |
+
{{- content }}
|
78 |
{{- '\n</tool_response>' }}
|
79 |
{%- if loop.last or (messages[loop.index0 + 1].role != "tool") %}
|
80 |
{{- '<|im_end|>\n' }}
|
|
|
83 |
{%- endfor %}
|
84 |
{%- if add_generation_prompt %}
|
85 |
{{- '<|im_start|>assistant\n' }}
|
86 |
+
{%- if enable_thinking is defined and enable_thinking is false %}
|
87 |
+
{{- '<think>\n\n</think>\n\n' }}
|
88 |
+
{%- endif %}
|
89 |
+
{%- endif %}
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eae859289f663cc784ee7d7fe9ad753ae5c9b1f49727b3515e9b37fe90fc2a6b
|
3 |
+
size 7416
|