diff --git a/.gitattributes b/.gitattributes
index a6344aac8c09253b3b630fb776ae94478aa0275b..aa7aacd0134a92c3c1943fdecc75cd8b7420cce6 100644
--- a/.gitattributes
+++ b/.gitattributes
@@ -33,3 +33,5 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
*.zip filter=lfs diff=lfs merge=lfs -text
*.zst filter=lfs diff=lfs merge=lfs -text
*tfevents* filter=lfs diff=lfs merge=lfs -text
+model.safetensors.index.json filter=lfs diff=lfs merge=lfs -text
+tokenizer.json filter=lfs diff=lfs merge=lfs -text
diff --git a/.mdl b/.mdl
new file mode 100644
index 0000000000000000000000000000000000000000..3b940d405e39dff8d36da2a61cd1dbf197f51cc4
Binary files /dev/null and b/.mdl differ
diff --git a/.msc b/.msc
new file mode 100644
index 0000000000000000000000000000000000000000..706d9786519e92dc694820305a377a2a76d8350e
Binary files /dev/null and b/.msc differ
diff --git a/.mv b/.mv
new file mode 100644
index 0000000000000000000000000000000000000000..0beb780a4ddfc8fc98024520db2e86d497d9594f
--- /dev/null
+++ b/.mv
@@ -0,0 +1 @@
+Revision:master,CreatedAt:1753860431
\ No newline at end of file
diff --git a/README.md b/README.md
new file mode 100644
index 0000000000000000000000000000000000000000..ee29a19f89eccf7eeda5be2f5406140edff91ebc
--- /dev/null
+++ b/README.md
@@ -0,0 +1,104 @@
+---
+library_name: transformers
+pipeline_tag: text-generation
+tags:
+- glm4_moe
+- GPTQ
+- Int4-Int8Mix
+- 量化修复
+- vLLM
+base_model:
+ - ZhipuAI/GLM-4.5
+base_model_relation: quantized
+---
+# GLM-4.5-GPTQ-Int4-Int8Mix
+基础模型:[ZhipuAI/GLM-4.5](https://www.modelscope.cn/models/ZhipuAI/GLM-4.5)
+
+
+### 【vLLM 单机8卡启动命令】
+注:使用 8 卡启动该模型时必须加上 `--enable-expert-parallel`,否则专家张量无法被 TP(张量并行)数整除;4 卡启动则不需要。
+```
+CONTEXT_LENGTH=32768
+
+vllm serve \
+ tclf90/GLM-4.5-GPTQ-Int4-Int8Mix \
+ --served-model-name GLM-4.5-GPTQ-Int4-Int8Mix \
+ --enable-expert-parallel \
+ --swap-space 16 \
+ --max-num-seqs 512 \
+ --max-model-len $CONTEXT_LENGTH \
+ --max-seq-len-to-capture $CONTEXT_LENGTH \
+ --gpu-memory-utilization 0.9 \
+ --tensor-parallel-size 8 \
+ --trust-remote-code \
+ --disable-log-requests \
+ --host 0.0.0.0 \
+ --port 8000
+```
+
+### 【依赖】
+
+```
+vllm==0.10.0
+```
+
+### 【模型更新日期】
+```
+2025-07-30
+1. 首次commit
+```
+
+### 【模型列表】
+
+| 文件大小 | 最近更新时间 |
+|---------|--------------|
+| `192GB` | `2025-07-30` |
+
+
+
+### 【模型下载】
+
+```python
+from modelscope import snapshot_download
+snapshot_download('tclf90/GLM-4.5-GPTQ-Int4-Int8Mix', cache_dir="本地路径")
+```
+
+
+### 【介绍】
+# GLM-4.5
+
+
+

+
+
+ 👋 加入我们的 微信群 。
+
+ 📖 查看GLM-4.5 技术博客 。
+
+ 📍 在 智谱AI开放平台 上使用GLM-4.5 API服务。
+
+ 👉 一键体验 GLM-4.5 。
+
+
+## 模型介绍
+
+**GLM-4.5** 系列模型是专为智能体设计的基础模型。GLM-4.5拥有 **3550** 亿总参数量,其中 **320** 亿活跃参数;GLM-4.5-Air采用更紧凑的设计,拥有
+ **1060** 亿总参数量,其中 **120** 亿活跃参数。GLM-4.5模型统一了推理、编码和智能体能力,以满足智能体应用的复杂需求。
+
+GLM-4.5 和 GLM-4.5-Air 都是混合推理模型,提供两种模式:用于复杂推理和工具使用的思考模式,以及用于即时响应的非思考模式。
+
+我们已开源了 GLM-4.5 和 GLM-4.5-Air 的基础模型、混合推理模型以及混合推理模型的FP8版本。它们采用MIT开源许可证发布,可用于商业用途和二次开发。
+
+在我们对12项行业标准基准的全面评估中,GLM-4.5表现卓越,得分 **63.2**,在所有专有和开源模型中排名**第3**。
+值得注意的是,GLM-4.5-Air在保持优异效率的同时,仍取得了 **59.8** 的竞争性成绩。
+
+
+
+如需了解更多评估结果、展示案例和技术细节,请访问我们的 [技术博客](https://z.ai/blog/glm-4.5)。技术报告将很快发布。
+
+模型代码、工具解析器和推理解析器可在 [transformers](https://github.com/huggingface/transformers/tree/main/src/transformers/models/glm4_moe)、 [vLLM](https://github.com/vllm-project/vllm/blob/main/vllm/model_executor/models/glm4_moe_mtp.py)
+和 [SGLang](https://github.com/sgl-project/sglang/blob/main/python/sglang/srt/models/glm4_moe.py) 的实现中找到。
+
+## 快速开始
+
+请参考我们的[github](https://github.com/zai-org/GLM-4.5)项目。
diff --git a/chat_template.jinja b/chat_template.jinja
new file mode 100644
index 0000000000000000000000000000000000000000..41478957aca7a04b7321022e7d1f73de5badd995
--- /dev/null
+++ b/chat_template.jinja
@@ -0,0 +1,103 @@
+[gMASK]<sop>
+{%- if tools -%}
+<|system|>
+# Tools
+
+You may call one or more functions to assist with the user query.
+
+You are provided with function signatures within <tools></tools> XML tags:
+<tools>
+{% for tool in tools %}
+{{ tool | tojson(ensure_ascii=False) }}
+{% endfor %}
+</tools>
+
+For each function call, output the function name and arguments within the following XML format:
+<tool_call>{function-name}
+<arg_key>{arg-key-1}</arg_key>
+<arg_value>{arg-value-1}</arg_value>
+<arg_key>{arg-key-2}</arg_key>
+<arg_value>{arg-value-2}</arg_value>
+...
+</tool_call>{%- endif -%}
+{#- visible_text: emit string content as-is; for a non-mapping iterable, concatenate its 'text' parts and bare string items. -#}{%- macro visible_text(content) -%}
+ {%- if content is string -%}
+ {{- content }}
+ {%- elif content is iterable and content is not mapping -%}
+ {%- for item in content -%}
+ {%- if item is mapping and item.type == 'text' -%}
+ {{- item.text }}
+ {%- elif item is string -%}
+ {{- item }}
+ {%- endif -%}
+ {%- endfor -%}
+ {%- else -%}
+ {{- content }}
+ {%- endif -%}
+{%- endmacro -%}
+{#- Record the index of the last user message: assistant reasoning is only re-emitted for turns that come after it. -#}{%- set ns = namespace(last_user_index=-1) %}
+{%- for m in messages %}
+ {%- if m.role == 'user' %}
+ {% set ns.last_user_index = loop.index0 -%}
+ {%- endif %}
+{%- endfor %}
+{% for m in messages %}
+{%- if m.role == 'user' -%}<|user|>
+{{ visible_text(m.content) }}
+{{- '/nothink' if (enable_thinking is defined and not enable_thinking and not visible_text(m.content).endswith("/nothink")) else '' -}}
+{%- elif m.role == 'assistant' -%}
+<|assistant|>
+{%- set reasoning_content = '' %}
+{%- set content = visible_text(m.content) %}
+{%- if m.reasoning_content is string %}
+ {%- set reasoning_content = m.reasoning_content %}
+{%- else %}
+ {%- if '</think>' in content %}
+ {%- set reasoning_content = content.split('</think>')[0].rstrip('\n').split('<think>')[-1].lstrip('\n') %}
+ {%- set content = content.split('</think>')[-1].lstrip('\n') %}
+ {%- endif %}
+{%- endif %}
+{%- if loop.index0 > ns.last_user_index and reasoning_content -%}
+{{ '\n<think>' + reasoning_content.strip() + '</think>'}}
+{%- else -%}
+{{ '\n<think></think>' }}
+{%- endif -%}
+{%- if content.strip() -%}
+{{ '\n' + content.strip() }}
+{%- endif -%}
+{% if m.tool_calls %}
+{% for tc in m.tool_calls %}
+{%- if tc.function %}
+ {%- set tc = tc.function %}
+{%- endif %}
+{{ '\n<tool_call>' + tc.name }}
+{% set _args = tc.arguments %}
+{% for k, v in _args.items() %}
+<arg_key>{{ k }}</arg_key>
+<arg_value>{{ v | tojson(ensure_ascii=False) if v is not string else v }}</arg_value>
+{% endfor %}
+</tool_call>{% endfor %}
+{% endif %}
+{#- Tool results: for string content, consecutive tool messages share one observation header; each result is wrapped in a tool_response block. -#}{%- elif m.role == 'tool' -%}
+{%- if m.content is string -%}
+{%- if loop.first or (messages[loop.index0 - 1].role != "tool") %}
+ {{- '<|observation|>' }}
+{%- endif %}
+{{- '\n<tool_response>\n' }}
+{{- m.content }}
+{{- '\n</tool_response>' }}
+{%- else -%}
+<|observation|>{% for tr in m.content %}
+
+<tool_response>
+{{ tr.output if tr.output is defined else tr }}
+</tool_response>{% endfor -%}
+{% endif -%}
+{%- elif m.role == 'system' -%}
+<|system|>
+{{ visible_text(m.content) }}
+{%- endif -%}
+{%- endfor -%}
+{#- Generation prompt: pre-fill an empty think block when enable_thinking is explicitly set to false. -#}{%- if add_generation_prompt -%}
+ <|assistant|>{{- '\n<think></think>' if (enable_thinking is defined and not enable_thinking) else '' -}}
+{%- endif -%}
\ No newline at end of file
diff --git a/config.json b/config.json
new file mode 100644
index 0000000000000000000000000000000000000000..32979fc8b1bb39c34a48593b8054955a92288492
--- /dev/null
+++ b/config.json
@@ -0,0 +1,60 @@
+{
+ "name_or_path": "tclf90/GLM-4.5-GPTQ-Int4-Int8Mix",
+ "architectures": [
+ "Glm4MoeForCausalLM"
+ ],
+ "attention_bias": true,
+ "attention_dropout": 0.0,
+ "pad_token_id": 151329,
+ "eos_token_id": [
+ 151329,
+ 151336,
+ 151338
+ ],
+ "head_dim": 128,
+ "hidden_act": "silu",
+ "hidden_size": 5120,
+ "partial_rotary_factor": 0.5,
+ "initializer_range": 0.02,
+ "intermediate_size": 12288,
+ "max_position_embeddings": 131072,
+ "model_type": "glm4_moe",
+ "moe_intermediate_size": 1536,
+ "norm_topk_prob": true,
+ "num_attention_heads": 96,
+ "n_group": 1,
+ "topk_group": 1,
+ "n_routed_experts": 160,
+ "n_shared_experts": 1,
+ "routed_scaling_factor": 2.5,
+ "num_experts_per_tok": 8,
+ "first_k_dense_replace": 3,
+ "num_hidden_layers": 92,
+ "num_key_value_heads": 8,
+ "rms_norm_eps": 1e-05,
+ "rope_scaling": null,
+ "rope_theta": 1000000,
+ "num_nextn_predict_layers": 1,
+ "tie_word_embeddings": false,
+ "torch_dtype": "float16",
+ "transformers_version": "4.54.0",
+ "use_cache": true,
+ "use_qk_norm": true,
+ "vocab_size": 151552,
+ "quantization_config": {
+ "quant_method": "gptq_marlin",
+ "bits": 4,
+ "group_size": 128,
+ "sym": true,
+ "desc_act": false,
+ "dynamic": {
+ "-:model.embed_tokens.weight": {},
+ "-:.*shared_experts": {},
+ "-:.*shared_head": {},
+ "-:lm_head.weight": {},
+ "+:model[.]layers[.]([0-4]|9[0-2])[.].*": {
+ "bits": 8
+ }
+ }
+ }
+}
\ No newline at end of file
diff --git a/configuration.json b/configuration.json
new file mode 100644
index 0000000000000000000000000000000000000000..f9291c34499303a5103dea21c45e605bb20981bb
--- /dev/null
+++ b/configuration.json
@@ -0,0 +1 @@
+{"framework":"Pytorch","task":"text-generation"}
\ No newline at end of file
diff --git a/generation_config.json b/generation_config.json
new file mode 100644
index 0000000000000000000000000000000000000000..4d49113f3e19072368c98e53180331c77c07c8a6
--- /dev/null
+++ b/generation_config.json
@@ -0,0 +1,10 @@
+{
+ "_from_model_config": true,
+ "eos_token_id": [
+ 151329,
+ 151336,
+ 151338
+ ],
+ "pad_token_id": 151329,
+ "transformers_version": "4.54.0"
+}
diff --git a/model-00001-of-00042.safetensors b/model-00001-of-00042.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..19daf20f8c9e31e194bcd8ea0bea1d475a642b25
--- /dev/null
+++ b/model-00001-of-00042.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0f46be18c5c61ad77e75b44481c02392f82d761ff7a734d85fa6bd274f841319
+size 4997791792
diff --git a/model-00002-of-00042.safetensors b/model-00002-of-00042.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..10b129d86543002f8c7d90f40d9376eeab99bf25
--- /dev/null
+++ b/model-00002-of-00042.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0d0c23be7ba1c2c4a2f8e25e3ac1aca18faa729a0ac0231dc011340f2dab8862
+size 4995143368
diff --git a/model-00003-of-00042.safetensors b/model-00003-of-00042.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..888d0e5bb3762d34ae858b5e9d98227c12efb732
--- /dev/null
+++ b/model-00003-of-00042.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:119ee325fad2b030c9b18cfbdfde59e8fa520748e9a01eef54e6f13bd4a6ca62
+size 4998558160
diff --git a/model-00004-of-00042.safetensors b/model-00004-of-00042.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..3d12f33bc29e718cbbeb8ee5d88f088ea8840cb5
--- /dev/null
+++ b/model-00004-of-00042.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5f01b3af8cabb53ac62b9e03d9751fc7447620b7a21b88ac93c05c1a45ead73a
+size 4997866008
diff --git a/model-00005-of-00042.safetensors b/model-00005-of-00042.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..85c1839177f03ead4821a07e88fe1944e72d20ba
--- /dev/null
+++ b/model-00005-of-00042.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5715b92e0875862e66c6f6cfb4308e344933ace38939be051b0bca1a5fbd6d9e
+size 4998724880
diff --git a/model-00006-of-00042.safetensors b/model-00006-of-00042.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..754acc6a06bbec428c6adb8e6301510fdec0e822
--- /dev/null
+++ b/model-00006-of-00042.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cbd0166ddde1deda2605e9cfae0fbc6a6aa67ef5055adef790e782f82e616650
+size 4997885480
diff --git a/model-00007-of-00042.safetensors b/model-00007-of-00042.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..372fdc0d23b00d7eba3c66bcbd130d53bf5ad90e
--- /dev/null
+++ b/model-00007-of-00042.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1d7b08652f20b58e62214cc90d68ba5e1db63e7bc2673413c34bc41271076eaa
+size 4997870632
diff --git a/model-00008-of-00042.safetensors b/model-00008-of-00042.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..699b6a19cab43b068302fc613c0f3b21bc23d4fc
--- /dev/null
+++ b/model-00008-of-00042.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:652608a7e87e29bc971d87049b0271e9668dc9c97d2891c2fb886c507c2c3864
+size 4998727768
diff --git a/model-00009-of-00042.safetensors b/model-00009-of-00042.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..83d91bddbd78c5fb48f33717c930c8238fef4065
--- /dev/null
+++ b/model-00009-of-00042.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8f99aeb3c53dcdcb562a8b7dad870a4bb073b56e128a85f990d45472ebea7fa4
+size 4997870784
diff --git a/model-00010-of-00042.safetensors b/model-00010-of-00042.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..53735ace7822f0e33d14972b447c2253204b37ae
--- /dev/null
+++ b/model-00010-of-00042.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f6b93fe2d1f3bf1032d106987a3a7bf60f9a24cf03a6d3297326f5396e67dbf3
+size 4998727328
diff --git a/model-00011-of-00042.safetensors b/model-00011-of-00042.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..517559958754861b2486b18efe98e96d2b0724ec
--- /dev/null
+++ b/model-00011-of-00042.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:3c7c12475ba2bffebd3feae808826d71199472d52a415cbd041a923d8064b0c1
+size 4997885552
diff --git a/model-00012-of-00042.safetensors b/model-00012-of-00042.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..efb5362a04b97262f1868ac2c47a837d66606503
--- /dev/null
+++ b/model-00012-of-00042.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d67574ca8ddfef22e618bbc3f30a111b20cd1407b4a7e214e3542c880b42973a
+size 4997870600
diff --git a/model-00013-of-00042.safetensors b/model-00013-of-00042.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..ab7b427daed6619a4c82fbba1d1ca947a878bcbe
--- /dev/null
+++ b/model-00013-of-00042.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:33d35d61b1d96d5f2e539e4db5d7d5a2c9577ebf45ee3018cb5cb64f8b922f98
+size 4998727688
diff --git a/model-00014-of-00042.safetensors b/model-00014-of-00042.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..88bc755148133b7f8c12c51748649576d3c84f22
--- /dev/null
+++ b/model-00014-of-00042.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5fe9ea1814714f05063d10f52608ba26f6c8eead6c5f70bcaa9561eecb9aab67
+size 4997870848
diff --git a/model-00015-of-00042.safetensors b/model-00015-of-00042.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..d1c64ba7acf58d40d8b99b552e92ae8908904875
--- /dev/null
+++ b/model-00015-of-00042.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5af3aa46d331a1f71b7a59d2f24404923dc09c1353ba2d62398ea6d27d115d07
+size 4998727256
diff --git a/model-00016-of-00042.safetensors b/model-00016-of-00042.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..fe12ad946ed59b2dd46d23aec57df8982d905882
--- /dev/null
+++ b/model-00016-of-00042.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:bf76d7ccaad77b3a949b3da4e84df952474760d1883e46582c0c3862c053ff50
+size 4997885624
diff --git a/model-00017-of-00042.safetensors b/model-00017-of-00042.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..2589dd6a0be084bf887e92202c3020b8a373acdb
--- /dev/null
+++ b/model-00017-of-00042.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2f12cb86218ac0874e77ca060b98e3a1e26992e72da45eae7d14fd87e53a9b45
+size 4997870552
diff --git a/model-00018-of-00042.safetensors b/model-00018-of-00042.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..40bca92ce29cb0c5cf236748f9d165ff2aa66fd2
--- /dev/null
+++ b/model-00018-of-00042.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:eab1bae4f78987bfb1d3faa9d09c623743b828cd57671e2414e62e295a68e0b4
+size 4998727616
diff --git a/model-00019-of-00042.safetensors b/model-00019-of-00042.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..92be3ca09b93a0fbb9243c614945e2ea23f45aff
--- /dev/null
+++ b/model-00019-of-00042.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:76c572c7086e1c2f8e846c63a7143123a965c5375580700ac09c0ace5ef67bfb
+size 4997870928
diff --git a/model-00020-of-00042.safetensors b/model-00020-of-00042.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..b6c811a010a2e5dce62b4371b5cb49fa44e65bb4
--- /dev/null
+++ b/model-00020-of-00042.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4b421afde37aa9f9d7deae828afedba5bca49690d0bb2738314c1e81c9d33735
+size 4998727200
diff --git a/model-00021-of-00042.safetensors b/model-00021-of-00042.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..a8cc4b99ab0b1a84f310be5b89283b7455c4fab1
--- /dev/null
+++ b/model-00021-of-00042.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:83d77013b648e243bccb682c6316c559994d687e21d2aa9267b14fa42bcc167c
+size 4997885672
diff --git a/model-00022-of-00042.safetensors b/model-00022-of-00042.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..d0fb14ab49571e481e97da99dee32febceda805d
--- /dev/null
+++ b/model-00022-of-00042.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:391ee2914fbcd742e95e7b6638d9f1114f24573d15d58c12724249fae2e90dd6
+size 4997870560
diff --git a/model-00023-of-00042.safetensors b/model-00023-of-00042.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..2a01c7db4ea2273164ca8729a7ef1c66d52dc29c
--- /dev/null
+++ b/model-00023-of-00042.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d5aaf6e316274fdbe49fb7e74d3030e923ef2ed3566f9b4c31faec7647881a0a
+size 4998727544
diff --git a/model-00024-of-00042.safetensors b/model-00024-of-00042.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..ff0682b6f22f505c8cb2fea30592135b2558029a
--- /dev/null
+++ b/model-00024-of-00042.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:87247632f93b563907e41d1c49cae6f5f93d4bffc7f4accafe3f1e357502a454
+size 4997870992
diff --git a/model-00025-of-00042.safetensors b/model-00025-of-00042.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..e488303e02856eaa5afdf57b407bdf9da6ad96e7
--- /dev/null
+++ b/model-00025-of-00042.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:085fdc3105b20d70457ed941917f2be8891d2e4f74efe66a240320e546da18cc
+size 4992074384
diff --git a/model-00026-of-00042.safetensors b/model-00026-of-00042.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..09044100e8032d496462c137a7943b01a3bd584d
--- /dev/null
+++ b/model-00026-of-00042.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2e141471ee2844b34835a9762a5f430abbbfd55e17bb00f16506796690114c84
+size 5000431872
diff --git a/model-00027-of-00042.safetensors b/model-00027-of-00042.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..9d66405c5457ae57eb33f90aa1ac587e2041c76a
--- /dev/null
+++ b/model-00027-of-00042.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4782ffe566b700905c1f7308575794cc8a1ff3ac0a88cb18e60b9e34c8494d10
+size 4997870632
diff --git a/model-00028-of-00042.safetensors b/model-00028-of-00042.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..ae71e657debb566123bc3a28d2f2b0fcd5ccccbf
--- /dev/null
+++ b/model-00028-of-00042.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b76437186c4d750f514dad4a658a946da715ccd39956c98c6b3a10a55a3f2cbd
+size 4998727472
diff --git a/model-00029-of-00042.safetensors b/model-00029-of-00042.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..b8aec0cad7796e006671bf066fa42f350d6692d0
--- /dev/null
+++ b/model-00029-of-00042.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6520a59490e95c2601fbd5189b999c2a177460927ce38c83dc31fb3a0870e924
+size 4997885424
diff --git a/model-00030-of-00042.safetensors b/model-00030-of-00042.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..b30046e6548e9685c8252569355f41923bf4e688
--- /dev/null
+++ b/model-00030-of-00042.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e25cfb597302a5f0dbaa8f2e125d4e6fdc82102f6df9e8d1b11554dda48abd0b
+size 4997870632
diff --git a/model-00031-of-00042.safetensors b/model-00031-of-00042.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..929931b216c24e14d77d005fbc2f117218ce713a
--- /dev/null
+++ b/model-00031-of-00042.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cfd7f8b1d038061d82c622f1312957e0fc71527a5866b155a3d337f6e23f1e2e
+size 4998727920
diff --git a/model-00032-of-00042.safetensors b/model-00032-of-00042.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..5ca0e650fae21161d4e8aea8ca5b26509b386e14
--- /dev/null
+++ b/model-00032-of-00042.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d05c7451e1ee61e6743f8fec34616f0f264087a61accb64d2bb2beef87af2db4
+size 4997870704
diff --git a/model-00033-of-00042.safetensors b/model-00033-of-00042.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..680513b5ee17523e0911933d279cceaad2d46ab4
--- /dev/null
+++ b/model-00033-of-00042.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c6e84066f314fb27dec57a9c926ee44b38efa5e356689bbf72bac0049a476b5c
+size 4998727400
diff --git a/model-00034-of-00042.safetensors b/model-00034-of-00042.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..3207473c1a51524e79cc2a5ac7210b4d3bfeb0b1
--- /dev/null
+++ b/model-00034-of-00042.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d8df659065fb44433c1c9f3c7072f49f1dcb208c1acb3c2dcca5d9c0884c7788
+size 4997885480
diff --git a/model-00035-of-00042.safetensors b/model-00035-of-00042.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..5d6ce01316303c4abb055e0a219536ad72e78e92
--- /dev/null
+++ b/model-00035-of-00042.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b70521cac48074544b02ecacb87ebda92ffd0561e313a7caac92dbce7867aa01
+size 4997870632
diff --git a/model-00036-of-00042.safetensors b/model-00036-of-00042.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..dc4e4cf7d7a127a4ea836d7d636064f808e1e535
--- /dev/null
+++ b/model-00036-of-00042.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9cd8902455f4b079b11938d21bfd8c18cc184bb1e5575f92df030f7ab5ec9520
+size 4998727768
diff --git a/model-00037-of-00042.safetensors b/model-00037-of-00042.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..cdf3ebe24f56c697ed9542b3532e715a726985a5
--- /dev/null
+++ b/model-00037-of-00042.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ff5e9f40e4d734b4709d9dd93ff15e2db656ceac53e5cc59ac55877fd1820641
+size 4997870784
diff --git a/model-00038-of-00042.safetensors b/model-00038-of-00042.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..4dd3de69e8e9e35e171e070d4733b2c0e037f8d3
--- /dev/null
+++ b/model-00038-of-00042.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8cebed347d069631ce5954cb926aca7b088cdecbb38cd25fac4149a1d63c793d
+size 5000057424
diff --git a/model-00039-of-00042.safetensors b/model-00039-of-00042.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..b65de9b8550e96a6958a24b5d94d96aba9405883
--- /dev/null
+++ b/model-00039-of-00042.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a806592646ceca0325e2ac917eb02769efaef3d2dee0ca1b66540aae3b6ac5e7
+size 3898292992
diff --git a/model-00040-of-00042.safetensors b/model-00040-of-00042.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..e1183d5dade4ce9508f31b86b1ab4d6bf1d1ddd6
--- /dev/null
+++ b/model-00040-of-00042.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ec535fba714a3a2a869a50a4311dfa699064e29567bc53ff4c2f9f9826970f0d
+size 4995595616
diff --git a/model-00041-of-00042.safetensors b/model-00041-of-00042.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..cd160a28a416ae567c6f7404aafc53c388d61d28
--- /dev/null
+++ b/model-00041-of-00042.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9c4d750640cbff926a5892cdcf1831747d3d9bcb0fc7208f73af0e2dea56e65c
+size 4998632224
diff --git a/model-00042-of-00042.safetensors b/model-00042-of-00042.safetensors
new file mode 100644
index 0000000000000000000000000000000000000000..998818f6f741f8f8127b3914894c2df3c1e6afbb
--- /dev/null
+++ b/model-00042-of-00042.safetensors
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:50a3be345ac099740315f5e48e4e0c5914fd7e9c319a08c948bd33a65570454c
+size 1333687200
diff --git a/model.safetensors.index.json b/model.safetensors.index.json
new file mode 100644
index 0000000000000000000000000000000000000000..8ef744d2f29a3d1a6c1172ac4302e16e7c821b36
--- /dev/null
+++ b/model.safetensors.index.json
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:49dbd0a1da7cc76fa1f14902f4cec3fb5b658d056da59b652a4345e3e27fdfaf
+size 15871572
diff --git a/tokenizer.json b/tokenizer.json
new file mode 100644
index 0000000000000000000000000000000000000000..43a71efad1ab3f7e4d66d1e48e7cc44f68f21f3a
--- /dev/null
+++ b/tokenizer.json
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9340665016419c825c4bdabbcc9acc43b7ca2c68ce142724afa829abb1be5efd
+size 19970699
diff --git a/tokenizer_config.json b/tokenizer_config.json
new file mode 100644
index 0000000000000000000000000000000000000000..053f12c9b03d5acbcc921042ea0c87a6baa5d3f7
--- /dev/null
+++ b/tokenizer_config.json
@@ -0,0 +1,325 @@
+{
+ "added_tokens_decoder": {
+ "151329": {
+ "content": "<|endoftext|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "151330": {
+ "content": "[MASK]",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "151331": {
+ "content": "[gMASK]",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "151332": {
+ "content": "[sMASK]",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "151333": {
+ "content": "<sop>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "151334": {
+ "content": "<eop>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "151335": {
+ "content": "<|system|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "151336": {
+ "content": "<|user|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "151337": {
+ "content": "<|assistant|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "151338": {
+ "content": "<|observation|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "151339": {
+ "content": "<|begin_of_image|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "151340": {
+ "content": "<|end_of_image|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "151341": {
+ "content": "<|begin_of_video|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "151342": {
+ "content": "<|end_of_video|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "151343": {
+ "content": "<|begin_of_audio|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "151344": {
+ "content": "<|end_of_audio|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "151345": {
+ "content": "<|begin_of_transcription|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "151346": {
+ "content": "<|end_of_transcription|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "151347": {
+ "content": "<|code_prefix|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "151348": {
+ "content": "<|code_middle|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "151349": {
+ "content": "<|code_suffix|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "151350": {
+ "content": "<think>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": false
+ },
+ "151351": {
+ "content": "</think>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": false
+ },
+ "151352": {
+ "content": "<tool_call>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": false
+ },
+ "151353": {
+ "content": "</tool_call>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": false
+ },
+ "151354": {
+ "content": "<tool_response>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": false
+ },
+ "151355": {
+ "content": "</tool_response>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": false
+ },
+ "151356": {
+ "content": "<arg_key>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": false
+ },
+ "151357": {
+ "content": "</arg_key>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": false
+ },
+ "151358": {
+ "content": "<arg_value>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": false
+ },
+ "151359": {
+ "content": "</arg_value>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": false
+ },
+ "151360": {
+ "content": "/nothink",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": true
+ },
+ "151361": {
+ "content": "<|begin_of_box|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": false
+ },
+ "151362": {
+ "content": "<|end_of_box|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": false
+ },
+ "151363": {
+ "content": "<|image|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": false
+ },
+ "151364": {
+ "content": "<|video|>",
+ "lstrip": false,
+ "normalized": false,
+ "rstrip": false,
+ "single_word": false,
+ "special": false
+ }
+ },
+ "additional_special_tokens": [
+ "<|endoftext|>",
+ "[MASK]",
+ "[gMASK]",
+ "[sMASK]",
+ "<sop>",
+ "<eop>",
+ "<|system|>",
+ "<|user|>",
+ "<|assistant|>",
+ "<|observation|>",
+ "<|begin_of_image|>",
+ "<|end_of_image|>",
+ "<|begin_of_video|>",
+ "<|end_of_video|>",
+ "<|begin_of_audio|>",
+ "<|end_of_audio|>",
+ "<|begin_of_transcription|>",
+ "<|end_of_transcription|>",
+ "<|code_prefix|>",
+ "<|code_middle|>",
+ "<|code_suffix|>",
+ "/nothink"
+ ],
+ "clean_up_tokenization_spaces": false,
+ "do_lower_case": false,
+ "eos_token": "<|endoftext|>",
+ "extra_special_tokens": {},
+ "model_max_length": 128000,
+ "pad_token": "<|endoftext|>",
+ "padding_side": "left",
+ "remove_space": false,
+ "tokenizer_class": "PreTrainedTokenizer"
+}