diff --git a/.gitattributes b/.gitattributes index a6344aac8c09253b3b630fb776ae94478aa0275b..52373fe24473b1aa44333d318f578ae6bf04b49b 100644 --- a/.gitattributes +++ b/.gitattributes @@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text *.zip filter=lfs diff=lfs merge=lfs -text *.zst filter=lfs diff=lfs merge=lfs -text *tfevents* filter=lfs diff=lfs merge=lfs -text +tokenizer.json filter=lfs diff=lfs merge=lfs -text diff --git a/chat_template.jinja b/chat_template.jinja new file mode 100644 index 0000000000000000000000000000000000000000..41478957aca7a04b7321022e7d1f73de5badd995 --- /dev/null +++ b/chat_template.jinja @@ -0,0 +1,103 @@ +[gMASK] +{%- if tools -%} +<|system|> +# Tools + +You may call one or more functions to assist with the user query. + +You are provided with function signatures within XML tags: + +{% for tool in tools %} +{{ tool | tojson(ensure_ascii=False) }} +{% endfor %} + + +For each function call, output the function name and arguments within the following XML format: +{function-name} +{arg-key-1} +{arg-value-1} +{arg-key-2} +{arg-value-2} +... +{%- endif -%} +{%- macro visible_text(content) -%} + {%- if content is string -%} + {{- content }} + {%- elif content is iterable and content is not mapping -%} + {%- for item in content -%} + {%- if item is mapping and item.type == 'text' -%} + {{- item.text }} + {%- elif item is string -%} + {{- item }} + {%- endif -%} + {%- endfor -%} + {%- else -%} + {{- content }} + {%- endif -%} +{%- endmacro -%} +{%- set ns = namespace(last_user_index=-1) %} +{%- for m in messages %} + {%- if m.role == 'user' %} + {% set ns.last_user_index = loop.index0 -%} + {%- endif %} +{%- endfor %} +{% for m in messages %} +{%- if m.role == 'user' -%}<|user|> +{{ visible_text(m.content) }} +{{- '/nothink' if (enable_thinking is defined and not enable_thinking and not visible_text(m.content).endswith("/nothink")) else '' -}} +{%- elif m.role == 'assistant' -%} +<|assistant|> +{%- set reasoning_content = '' %} +{%- set content = visible_text(m.content) %} +{%- if m.reasoning_content is string %} + {%- set reasoning_content = m.reasoning_content %} +{%- else %} + {%- if '' in content %} + {%- set reasoning_content = content.split('')[0].rstrip('\n').split('')[-1].lstrip('\n') %} + {%- set content = content.split('')[-1].lstrip('\n') %} + {%- endif %} +{%- endif %} +{%- if loop.index0 > ns.last_user_index and reasoning_content -%} +{{ '\n' + reasoning_content.strip() + ''}} +{%- else -%} +{{ '\n' }} +{%- endif -%} +{%- if content.strip() -%} +{{ '\n' + content.strip() }} +{%- endif -%} +{% if m.tool_calls %} +{% for tc in m.tool_calls %} +{%- if tc.function %} + {%- set tc = tc.function %} +{%- endif %} +{{ '\n' + tc.name }} +{% set _args = tc.arguments %} +{% for k, v in _args.items() %} +{{ k }} +{{ v | tojson(ensure_ascii=False) if v is not string else v }} +{% endfor %} +{% endfor %} +{% endif %} +{%- elif m.role == 'tool' -%} +{%- if m.content is string -%} +{%- if loop.first or (messages[loop.index0 - 1].role != "tool") %} + {{- '<|observation|>' }} +{%- endif %} +{{- '\n\n' }} +{{- m.content }} +{{- '\n' }} +{%- else -%} +<|observation|>{% for tr in m.content %} + + +{{ tr.output if tr.output is defined else tr }} +{% endfor -%} +{% endif -%} +{%- elif m.role == 'system' -%} +<|system|> +{{ visible_text(m.content) }} +{%- endif -%} +{%- endfor -%} +{%- if add_generation_prompt -%} + <|assistant|>{{- '\n' if (enable_thinking is defined and not enable_thinking) else '' -}} +{%- endif -%} \ No newline at end of file diff --git a/config.json b/config.json new file mode 100644 index 0000000000000000000000000000000000000000..78eecfe543bad2caf772f9c28852d8e7bc25f301 --- /dev/null +++ b/config.json @@ -0,0 +1,417 @@ +{ + "architectures": [ + "Glm4MoeForCausalLM" + ], + "attention_bias": true, + "attention_dropout": 0.0, + "pad_token_id": 151329, + "eos_token_id": [ + 151329, + 151336, + 151338 + ], + "head_dim": 128, + "hidden_act": "silu", + "hidden_size": 4096, + "partial_rotary_factor": 0.5, + "initializer_range": 0.02, + "intermediate_size": 10944, + "max_position_embeddings": 131072, + "model_type": "glm4_moe", + "moe_intermediate_size": 1408, + "norm_topk_prob": true, + "num_attention_heads": 96, + "n_group": 1, + "topk_group": 1, + "n_routed_experts": 128, + "n_shared_experts": 1, + "routed_scaling_factor": 1.0, + "num_experts_per_tok": 8, + "first_k_dense_replace": 1, + "num_hidden_layers": 46, + "num_key_value_heads": 8, + "rms_norm_eps": 1e-05, + "rope_scaling": null, + "rope_theta": 1000000, + "num_nextn_predict_layers": 1, + "tie_word_embeddings": false, + "torch_dtype": "bfloat16", + "transformers_version": "4.54.0", + "use_cache": true, + "use_qk_norm": false, + "vocab_size": 151552, + "quantization_config": { + "config_groups": { + "group_0": { + "input_activations": { + "actorder": null, + "block_structure": null, + "dynamic": true, + "group_size": null, + "num_bits": 8, + "observer": null, + "observer_kwargs": {}, + "strategy": "token", + "symmetric": true, + "type": "float" + }, + "output_activations": null, + "targets": [ + "Linear" + ], + "weights": { + "actorder": null, + "block_structure": null, + "dynamic": false, + "group_size": null, + "num_bits": 8, + "observer": "minmax", + "observer_kwargs": {}, + "strategy": "channel", + "symmetric": true, + "type": "float" + } + } + }, + "format": "float-quantized", + "ignore": [ + "model.layers.9.mlp.gate", + "model.layers.22.self_attn.q_proj.bias", + "model.layers.21.post_attention_layernorm", + "model.layers.46.post_attention_layernorm", + "model.layers.33.mlp.gate.e_score_correction_bias", + "model.layers.19.input_layernorm", + "model.layers.23.input_layernorm", + "model.layers.26.input_layernorm", + "model.layers.16.input_layernorm", + "model.layers.2.input_layernorm", + "model.layers.43.mlp.gate.e_score_correction_bias", + "model.layers.17.self_attn.v_proj.bias", + "model.layers.4.self_attn.k_proj.bias", + "model.layers.24.mlp.gate", + "model.layers.42.self_attn.q_proj.bias", + "model.layers.19.self_attn.v_proj.bias", + "model.layers.36.self_attn.k_proj.bias", + "model.layers.43.self_attn.k_proj.bias", + "model.layers.26.self_attn.v_proj.bias", + "model.layers.33.mlp.gate", + "model.layers.31.input_layernorm", + "model.layers.8.input_layernorm", + "model.layers.9.mlp.gate.e_score_correction_bias", + "model.layers.19.mlp.gate.e_score_correction_bias", + "model.layers.14.self_attn.v_proj.bias", + "model.layers.19.mlp.gate", + "model.layers.12.mlp.gate", + "model.layers.37.mlp.gate.e_score_correction_bias", + "model.layers.39.mlp.gate", + "model.layers.20.self_attn.v_proj.bias", + "model.layers.1.self_attn.q_proj.bias", + "model.layers.7.self_attn.k_proj.bias", + "model.layers.19.self_attn.k_proj.bias", + "model.layers.30.mlp.gate.e_score_correction_bias", + "model.layers.37.input_layernorm", + "model.layers.40.self_attn.q_proj.bias", + "model.layers.30.input_layernorm", + "model.layers.10.post_attention_layernorm", + "model.layers.10.mlp.gate", + "model.layers.21.mlp.gate", + "model.layers.39.post_attention_layernorm", + "model.layers.20.self_attn.q_proj.bias", + "model.layers.20.input_layernorm", + "model.layers.16.self_attn.v_proj.bias", + "model.layers.5.self_attn.k_proj.bias", + "model.layers.18.input_layernorm", + "model.layers.35.input_layernorm", + "model.layers.43.mlp.gate", + "model.layers.5.self_attn.v_proj.bias", + "model.layers.28.mlp.gate", + "model.layers.4.self_attn.v_proj.bias", + "model.layers.46.mlp.gate.e_score_correction_bias", + "model.layers.25.mlp.gate.e_score_correction_bias", + "model.layers.46.enorm", + "model.layers.30.self_attn.k_proj.bias", + "model.layers.27.self_attn.v_proj.bias", + "model.layers.23.mlp.gate", + "model.layers.38.post_attention_layernorm", + "model.layers.0.post_attention_layernorm", + "model.layers.46.self_attn.k_proj.bias", + "model.layers.26.post_attention_layernorm", + "model.layers.26.self_attn.q_proj.bias", + "model.layers.46.embed_tokens", + "model.layers.24.input_layernorm", + "model.layers.41.post_attention_layernorm", + "model.layers.20.mlp.gate", + "model.layers.3.mlp.gate", + "model.layers.22.input_layernorm", + "model.layers.15.post_attention_layernorm", + "model.layers.39.input_layernorm", + "model.layers.42.mlp.gate.e_score_correction_bias", + "model.layers.34.mlp.gate", + "model.layers.13.mlp.gate", + "model.layers.38.input_layernorm", + "model.layers.15.self_attn.q_proj.bias", + "model.layers.7.post_attention_layernorm", + "model.layers.28.self_attn.v_proj.bias", + "model.layers.36.post_attention_layernorm", + "model.layers.34.self_attn.k_proj.bias", + "model.layers.23.post_attention_layernorm", + "model.layers.43.input_layernorm", + "model.layers.39.self_attn.k_proj.bias", + "model.layers.18.post_attention_layernorm", + "model.layers.29.mlp.gate.e_score_correction_bias", + "model.layers.34.mlp.gate.e_score_correction_bias", + "model.layers.28.self_attn.q_proj.bias", + "model.layers.46.eh_proj", + "model.layers.14.mlp.gate.e_score_correction_bias", + "model.layers.7.mlp.gate.e_score_correction_bias", + "model.layers.35.self_attn.k_proj.bias", + "model.layers.13.post_attention_layernorm", + "model.layers.22.self_attn.k_proj.bias", + "model.layers.4.self_attn.q_proj.bias", + "model.layers.41.self_attn.k_proj.bias", + "model.layers.12.post_attention_layernorm", + "model.layers.37.self_attn.q_proj.bias", + "model.layers.46.input_layernorm", + "model.layers.24.self_attn.k_proj.bias", + "model.layers.5.mlp.gate", + "model.layers.9.self_attn.k_proj.bias", + "model.layers.10.self_attn.v_proj.bias", + "model.layers.42.self_attn.v_proj.bias", + "model.embed_tokens", + "model.layers.2.self_attn.q_proj.bias", + "model.layers.28.mlp.gate.e_score_correction_bias", + "model.layers.24.self_attn.v_proj.bias", + "model.layers.15.input_layernorm", + "model.layers.9.input_layernorm", + "model.layers.33.input_layernorm", + "model.layers.45.self_attn.v_proj.bias", + "model.layers.31.self_attn.q_proj.bias", + "model.layers.34.input_layernorm", + "model.layers.14.input_layernorm", + "model.layers.17.post_attention_layernorm", + "model.layers.0.self_attn.k_proj.bias", + "model.layers.37.self_attn.v_proj.bias", + "model.norm", + "model.layers.9.self_attn.q_proj.bias", + "model.layers.4.input_layernorm", + "model.layers.45.self_attn.q_proj.bias", + "model.layers.7.self_attn.q_proj.bias", + "model.layers.32.self_attn.v_proj.bias", + "model.layers.22.self_attn.v_proj.bias", + "model.layers.45.post_attention_layernorm", + "model.layers.40.mlp.gate", + "model.layers.29.self_attn.v_proj.bias", + "model.layers.3.mlp.gate.e_score_correction_bias", + "model.layers.31.post_attention_layernorm", + "model.layers.41.self_attn.v_proj.bias", + "model.layers.5.input_layernorm", + "model.layers.13.self_attn.v_proj.bias", + "model.layers.26.self_attn.k_proj.bias", + "model.layers.28.post_attention_layernorm", + "model.layers.17.mlp.gate", + "model.layers.42.mlp.gate", + "model.layers.34.self_attn.v_proj.bias", + "model.layers.1.mlp.gate.e_score_correction_bias", + "model.layers.21.input_layernorm", + "model.layers.21.self_attn.k_proj.bias", + "model.layers.29.self_attn.k_proj.bias", + "model.layers.20.post_attention_layernorm", + "model.layers.14.post_attention_layernorm", + "model.layers.34.post_attention_layernorm", + "model.layers.27.self_attn.k_proj.bias", + "model.layers.24.mlp.gate.e_score_correction_bias", + "model.layers.31.mlp.gate.e_score_correction_bias", + "model.layers.2.self_attn.k_proj.bias", + "model.layers.25.self_attn.v_proj.bias", + "model.layers.1.post_attention_layernorm", + "model.layers.10.self_attn.q_proj.bias", + "model.layers.16.mlp.gate.e_score_correction_bias", + "model.layers.16.self_attn.q_proj.bias", + "model.layers.38.mlp.gate.e_score_correction_bias", + "model.layers.46.self_attn.q_proj.bias", + "model.layers.23.self_attn.k_proj.bias", + "model.layers.42.post_attention_layernorm", + "model.layers.33.self_attn.k_proj.bias", + "model.layers.30.mlp.gate", + "model.layers.34.self_attn.q_proj.bias", + "model.layers.4.post_attention_layernorm", + "model.layers.13.self_attn.k_proj.bias", + "model.layers.2.post_attention_layernorm", + "model.layers.40.post_attention_layernorm", + "model.layers.38.self_attn.k_proj.bias", + "model.layers.1.self_attn.k_proj.bias", + "model.layers.10.mlp.gate.e_score_correction_bias", + "model.layers.43.self_attn.v_proj.bias", + "model.layers.11.input_layernorm", + "model.layers.42.input_layernorm", + "model.layers.19.self_attn.q_proj.bias", + "model.layers.24.post_attention_layernorm", + "model.layers.12.input_layernorm", + "model.layers.42.self_attn.k_proj.bias", + "model.layers.12.self_attn.k_proj.bias", + "model.layers.0.self_attn.v_proj.bias", + "model.layers.1.mlp.gate", + "model.layers.39.self_attn.v_proj.bias", + "model.layers.14.mlp.gate", + "model.layers.44.post_attention_layernorm", + "model.layers.37.mlp.gate", + "model.layers.31.mlp.gate", + "model.layers.8.post_attention_layernorm", + "model.layers.2.mlp.gate.e_score_correction_bias", + "model.layers.36.input_layernorm", + "model.layers.30.post_attention_layernorm", + "model.layers.46.shared_head.norm", + "model.layers.4.mlp.gate", + "model.layers.6.mlp.gate", + "model.layers.29.mlp.gate", + "model.layers.7.mlp.gate", + "model.layers.0.self_attn.q_proj.bias", + "model.layers.44.mlp.gate", + "model.layers.32.self_attn.k_proj.bias", + "model.layers.4.mlp.gate.e_score_correction_bias", + "model.layers.18.self_attn.v_proj.bias", + "model.layers.30.self_attn.q_proj.bias", + "model.layers.21.mlp.gate.e_score_correction_bias", + "model.layers.32.post_attention_layernorm", + "model.layers.19.post_attention_layernorm", + "model.layers.22.mlp.gate", + "model.layers.13.mlp.gate.e_score_correction_bias", + "model.layers.8.mlp.gate", + "model.layers.36.self_attn.v_proj.bias", + "model.layers.5.post_attention_layernorm", + "model.layers.32.input_layernorm", + "model.layers.33.post_attention_layernorm", + "model.layers.21.self_attn.v_proj.bias", + "model.layers.2.mlp.gate", + "model.layers.13.input_layernorm", + "model.layers.15.self_attn.v_proj.bias", + "model.layers.16.self_attn.k_proj.bias", + "model.layers.2.self_attn.v_proj.bias", + "model.layers.43.post_attention_layernorm", + "model.layers.7.input_layernorm", + "model.layers.29.post_attention_layernorm", + "model.layers.20.self_attn.k_proj.bias", + "model.layers.38.mlp.gate", + "model.layers.18.mlp.gate.e_score_correction_bias", + "model.layers.25.input_layernorm", + "model.layers.1.input_layernorm", + "model.layers.46.hnorm", + "model.layers.31.self_attn.v_proj.bias", + "model.layers.14.self_attn.q_proj.bias", + "model.layers.18.self_attn.q_proj.bias", + "model.layers.8.self_attn.q_proj.bias", + "model.layers.35.self_attn.v_proj.bias", + "model.layers.45.mlp.gate.e_score_correction_bias", + "model.layers.9.post_attention_layernorm", + "model.layers.30.self_attn.v_proj.bias", + "model.layers.15.mlp.gate", + "model.layers.10.input_layernorm", + "model.layers.6.self_attn.q_proj.bias", + "model.layers.11.mlp.gate.e_score_correction_bias", + "model.layers.41.input_layernorm", + "model.layers.22.mlp.gate.e_score_correction_bias", + "model.layers.15.mlp.gate.e_score_correction_bias", + "model.layers.21.self_attn.q_proj.bias", + "model.layers.17.mlp.gate.e_score_correction_bias", + "model.layers.16.mlp.gate", + "model.layers.25.self_attn.q_proj.bias", + "model.layers.6.input_layernorm", + "model.layers.17.input_layernorm", + "model.layers.26.mlp.gate.e_score_correction_bias", + "model.layers.35.mlp.gate.e_score_correction_bias", + "model.layers.0.input_layernorm", + "model.layers.3.post_attention_layernorm", + "model.layers.6.self_attn.v_proj.bias", + "model.layers.27.mlp.gate.e_score_correction_bias", + "model.layers.18.mlp.gate", + "model.layers.28.input_layernorm", + "model.layers.9.self_attn.v_proj.bias", + "model.layers.31.self_attn.k_proj.bias", + "model.layers.40.self_attn.v_proj.bias", + "model.layers.12.self_attn.q_proj.bias", + "model.layers.41.mlp.gate", + "model.layers.5.self_attn.q_proj.bias", + "model.layers.11.self_attn.v_proj.bias", + "model.layers.36.mlp.gate", + "model.layers.27.self_attn.q_proj.bias", + "model.layers.40.self_attn.k_proj.bias", + "model.layers.11.post_attention_layernorm", + "model.layers.27.input_layernorm", + "model.layers.12.self_attn.v_proj.bias", + "model.layers.46.mlp.gate", + "model.layers.17.self_attn.k_proj.bias", + "model.layers.3.input_layernorm", + "model.layers.44.input_layernorm", + "model.layers.10.self_attn.k_proj.bias", + "model.layers.41.mlp.gate.e_score_correction_bias", + "model.layers.7.self_attn.v_proj.bias", + "model.layers.18.self_attn.k_proj.bias", + "model.layers.1.self_attn.v_proj.bias", + "model.layers.26.mlp.gate", + "model.layers.45.input_layernorm", + "model.layers.23.self_attn.v_proj.bias", + "model.layers.39.mlp.gate.e_score_correction_bias", + "model.layers.12.mlp.gate.e_score_correction_bias", + "model.layers.37.post_attention_layernorm", + "model.layers.46.self_attn.v_proj.bias", + "model.layers.36.mlp.gate.e_score_correction_bias", + "model.layers.5.mlp.gate.e_score_correction_bias", + "model.layers.35.mlp.gate", + "model.layers.44.self_attn.k_proj.bias", + "model.layers.3.self_attn.k_proj.bias", + "model.layers.11.mlp.gate", + "model.layers.11.self_attn.q_proj.bias", + "model.layers.17.self_attn.q_proj.bias", + "model.layers.32.self_attn.q_proj.bias", + "model.layers.11.self_attn.k_proj.bias", + "model.layers.40.mlp.gate.e_score_correction_bias", + "model.layers.41.self_attn.q_proj.bias", + "model.layers.15.self_attn.k_proj.bias", + "model.layers.44.self_attn.v_proj.bias", + "model.layers.25.self_attn.k_proj.bias", + "model.layers.25.post_attention_layernorm", + "model.layers.29.input_layernorm", + "model.layers.44.self_attn.q_proj.bias", + "model.layers.16.post_attention_layernorm", + "model.layers.6.mlp.gate.e_score_correction_bias", + "model.layers.38.self_attn.v_proj.bias", + "model.layers.40.input_layernorm", + "model.layers.6.post_attention_layernorm", + "model.layers.22.post_attention_layernorm", + "model.layers.8.self_attn.k_proj.bias", + "model.layers.37.self_attn.k_proj.bias", + "model.layers.23.mlp.gate.e_score_correction_bias", + "model.layers.27.mlp.gate", + "model.layers.8.mlp.gate.e_score_correction_bias", + "model.layers.28.self_attn.k_proj.bias", + "model.layers.24.self_attn.q_proj.bias", + "model.layers.39.self_attn.q_proj.bias", + "model.layers.36.self_attn.q_proj.bias", + "model.layers.45.self_attn.k_proj.bias", + "model.layers.32.mlp.gate.e_score_correction_bias", + "model.layers.35.self_attn.q_proj.bias", + "model.layers.33.self_attn.q_proj.bias", + "model.layers.14.self_attn.k_proj.bias", + "lm_head", + "model.layers.3.self_attn.v_proj.bias", + "model.layers.44.mlp.gate.e_score_correction_bias", + "model.layers.45.mlp.gate", + "model.layers.32.mlp.gate", + "model.layers.33.self_attn.v_proj.bias", + "model.layers.29.self_attn.q_proj.bias", + "model.layers.3.self_attn.q_proj.bias", + "model.layers.35.post_attention_layernorm", + "model.layers.6.self_attn.k_proj.bias", + "model.layers.43.self_attn.q_proj.bias", + "model.layers.20.mlp.gate.e_score_correction_bias", + "model.layers.8.self_attn.v_proj.bias", + "model.layers.13.self_attn.q_proj.bias", + "model.layers.27.post_attention_layernorm", + "model.layers.38.self_attn.q_proj.bias", + "model.layers.25.mlp.gate", + "model.layers.23.self_attn.q_proj.bias" + ], + "quant_method": "compressed-tensors", + "quantization_status": "compressed" + } +} \ No newline at end of file diff --git a/generation_config.json b/generation_config.json new file mode 100644 index 0000000000000000000000000000000000000000..4d49113f3e19072368c98e53180331c77c07c8a6 --- /dev/null +++ b/generation_config.json @@ -0,0 +1,10 @@ +{ + "_from_model_config": true, + "eos_token_id": [ + 151329, + 151336, + 151338 + ], + "pad_token_id": 151329, + "transformers_version": "4.54.0" +} diff --git a/model-00001-of-00047.safetensors b/model-00001-of-00047.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..290e4b0d0bf0812440ac2f5967aefd5f11342bdf --- /dev/null +++ b/model-00001-of-00047.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a402a8fac66c090eddd032e70aaa5ab9c87307aa44451c659e1b650f9c60ad53 +size 2726784880 diff --git a/model-00002-of-00047.safetensors b/model-00002-of-00047.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1bbdd2b955e1a2faf53b5ff5d9190e9984da6076 --- /dev/null +++ b/model-00002-of-00047.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d3801d622ff4292be51939389c2e30aac77dfc0d6728d777077b1d892c8eb7f +size 2345777464 diff --git a/model-00003-of-00047.safetensors b/model-00003-of-00047.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..89751787d32c8e726c2cf74316b861d1425e8978 --- /dev/null +++ b/model-00003-of-00047.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:370acfd3919de83ddde52b13520200c889233d776546a9b8f6834ce09163af72 +size 2345777464 diff --git a/model-00004-of-00047.safetensors b/model-00004-of-00047.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e564db1357862ace20d4dea25297e8974659163d --- /dev/null +++ b/model-00004-of-00047.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ee5f8494b76e349c0065073df819272b4abf799a56815ac0faa216251cd9075 +size 2345777464 diff --git a/model-00005-of-00047.safetensors b/model-00005-of-00047.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4c3127d141df656228fcfea62e24a0165e87f811 --- /dev/null +++ b/model-00005-of-00047.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fdc1fe9b9550617ee72997b29fc8f13d391a7bb1439d1df1d5ba5c159bcd5c78 +size 2345777464 diff --git a/model-00006-of-00047.safetensors b/model-00006-of-00047.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c1dd17f83b56655a9da6deb4a36abbc2b1dd4cb6 --- /dev/null +++ b/model-00006-of-00047.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee91fb563f9d471d1870f99496bbe576dd7435127d506cd251d8a40a0581ea25 +size 2345777464 diff --git a/model-00007-of-00047.safetensors b/model-00007-of-00047.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c1d01bfb66ae815825233859f551924005fc665a --- /dev/null +++ b/model-00007-of-00047.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b56b80408c45881d8b1aa234ebe4c4826af24abc26038051cd92ce0aa2212070 +size 2345777464 diff --git a/model-00008-of-00047.safetensors b/model-00008-of-00047.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..dd5a8d6c5e292bcf7f9f8be3cef03179a1b6d7b2 --- /dev/null +++ b/model-00008-of-00047.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f78687be00665850826872a5666ac3fb72c15cb70ffb6f8ab7da2e402ddfa307 +size 2345777464 diff --git a/model-00009-of-00047.safetensors b/model-00009-of-00047.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b61947f11ba0577f530056ae93bbded5fcc631e6 --- /dev/null +++ b/model-00009-of-00047.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65c39636822e6fa307ca0e27c4cc14e8045a80799f801d638a1ef6138534db37 +size 2345777464 diff --git a/model-00010-of-00047.safetensors b/model-00010-of-00047.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d3ac34905f2f8f1cf2c18bd980788a7c77ce649e --- /dev/null +++ b/model-00010-of-00047.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4dd40942500a67c1c7f3eee752a6777876923eea9b00fe3abe898794f5b44e28 +size 2345777464 diff --git a/model-00011-of-00047.safetensors b/model-00011-of-00047.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5913627131920353a61716f581d5b99f11c45605 --- /dev/null +++ b/model-00011-of-00047.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e400a5ca71912ac0ca8da5fc103c0ee6a7dd25eb68816620b4f30eb48e30138c +size 2345778256 diff --git a/model-00012-of-00047.safetensors b/model-00012-of-00047.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..39b791f4a2cb769fc278554ea335e1a677743f72 --- /dev/null +++ b/model-00012-of-00047.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef8b28bbe7d35824f3fcd79833333c1427dd844f9fa5872fb9b4e237a4b923e9 +size 2345778256 diff --git a/model-00013-of-00047.safetensors b/model-00013-of-00047.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2d5ae4a4511094fac615fd05c7f62ef2a43857f0 --- /dev/null +++ b/model-00013-of-00047.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b08854bbbeebd8df2cca69c83036698950b0ab0aca37497d4db5af1da55e021 +size 2345778256 diff --git a/model-00014-of-00047.safetensors b/model-00014-of-00047.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..25c45a2d89c6ce27fef0ea401ee88b8e3a7d5d63 --- /dev/null +++ b/model-00014-of-00047.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97df7e09418afdbeb89677b8baa1a8456a45c70f92597f307ea710c7fc71e5b5 +size 2345778256 diff --git a/model-00015-of-00047.safetensors b/model-00015-of-00047.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d501fa4f2fef819b26250bc7960a1ae1f8e4916d --- /dev/null +++ b/model-00015-of-00047.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb3cd4497d95e3fc0d679a3344d7bcf8ef50bcf9074eed34b5596099e6061624 +size 2345778256 diff --git a/model-00016-of-00047.safetensors b/model-00016-of-00047.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..225638feb8f8ac8374b2adc85788343afa136934 --- /dev/null +++ b/model-00016-of-00047.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9e55954e25fda8f2b1c224a39e2350ed29595659786ed9db1fdf30b03623ba9 +size 2345778256 diff --git a/model-00017-of-00047.safetensors b/model-00017-of-00047.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..306de6e1b204e65cb2c1f69ffd3f7a696e57bb65 --- /dev/null +++ b/model-00017-of-00047.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fdda21d70b7bf6e067a7da0b9abfbde5d7fbb33740fa0b4d2839b316f61f2f69 +size 2345778256 diff --git a/model-00018-of-00047.safetensors b/model-00018-of-00047.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..47abed9bb056aa173f008cbc5fe3088f625a0cc7 --- /dev/null +++ b/model-00018-of-00047.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:235e3a593ac9bccd5e6ee9ba1d8d5539c78b30632dafa2ce39ede0a6e7ce8a5f +size 2345778256 diff --git a/model-00019-of-00047.safetensors b/model-00019-of-00047.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5792c1b63a3da104594b5e9877e65c018bdcdcfb --- /dev/null +++ b/model-00019-of-00047.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75fe5acbcb61b0c243f52d7e2a3436f73c4b41f2b7645779d7f092cac8d6c122 +size 2345778256 diff --git a/model-00020-of-00047.safetensors b/model-00020-of-00047.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d39758ef6586ed7662f118f0bdc4f622c94f9a02 --- /dev/null +++ b/model-00020-of-00047.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e68c695f2d732a714c09ab07832dca8443ddcdc745bc4fc19c49962a1ff69a79 +size 2345778256 diff --git a/model-00021-of-00047.safetensors b/model-00021-of-00047.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..aecc6246d673e6bb6fde8afa1cd7d3eb2a5bf141 --- /dev/null +++ b/model-00021-of-00047.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8bcd058b41a7fef9d6c05cb024e776ee78f7cd00cf8c73b5e912fc28e32e7454 +size 2345778256 diff --git a/model-00022-of-00047.safetensors b/model-00022-of-00047.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..64afbb9bfcac85f24b92c21bf4aad817ef634b4f --- /dev/null +++ b/model-00022-of-00047.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31225cc96950af59d7775e287a7af7ffdf2a13ce8073114cef082a06e5c58083 +size 2345778256 diff --git a/model-00023-of-00047.safetensors b/model-00023-of-00047.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ba5fec7def6a42bda2f559ebb0e18c6324d2d214 --- /dev/null +++ b/model-00023-of-00047.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d71c2b109c55b79c61e98af7b80148a91a008770de217fee16483ec9f1eb8eef +size 2345778256 diff --git a/model-00024-of-00047.safetensors b/model-00024-of-00047.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..fbd491155af8a94af282ce3b9a119802dec132f1 --- /dev/null +++ b/model-00024-of-00047.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6077ad7f4ef58045de15cb4bdf66ca773d9917eb8179f1b5160ed65931be07cf +size 2345778256 diff --git a/model-00025-of-00047.safetensors b/model-00025-of-00047.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c59edbc9170db2a3872cb98597b527c1d475522c --- /dev/null +++ b/model-00025-of-00047.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4fa816ebe9f85d1a21c26182a4f2620b090604066136e2dee997d7c16c62e845 +size 2345778256 diff --git a/model-00026-of-00047.safetensors b/model-00026-of-00047.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..86516b7d0aa38986418f4e2d07c1c858b5a1c237 --- /dev/null +++ b/model-00026-of-00047.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ede66e0f34d047a685d0c88d4392b2ea7320c1f9ec58a91cdf86a3aa3187c111 +size 2345778256 diff --git a/model-00027-of-00047.safetensors b/model-00027-of-00047.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..03eec03cb845c351589cfe579235eb835091046d --- /dev/null +++ b/model-00027-of-00047.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae3404cd91efa7632e7761cef0e36d287531043b8293e8ca231f80556de0c943 +size 2345778256 diff --git a/model-00028-of-00047.safetensors b/model-00028-of-00047.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..018b85c8682fca5b4f599a6387c440d3305ba6cc --- /dev/null +++ b/model-00028-of-00047.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc866b2ceb0c216a0e34f0a5d7d7178e28db4f1170778ea2ee813c487adad690 +size 2345778256 diff --git a/model-00029-of-00047.safetensors b/model-00029-of-00047.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a56b2f3b6192aaaa17cb55641a43052dea7d16c1 --- /dev/null +++ b/model-00029-of-00047.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86c0aeefe2ccf3db32de08f211c89b2dac92f08ab9fce79a9cd0dac3a7168c94 +size 2345778256 diff --git a/model-00030-of-00047.safetensors b/model-00030-of-00047.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..1246989dec814c569f626e15c12a6180fb14bc3f --- /dev/null +++ b/model-00030-of-00047.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:934d52a70fce1b5350a6097a60b6e7d56e5c62e74bbd1f978b06b2cb05eda181 +size 2345778256 diff --git a/model-00031-of-00047.safetensors b/model-00031-of-00047.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0492796a91aea0549e5d00c7ea97b0b6d1f2b0e8 --- /dev/null +++ b/model-00031-of-00047.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1ae794e253939c3ace1438e156ee049c8380294a7cf2ceb71df6d24f3db7529 +size 2345778256 diff --git a/model-00032-of-00047.safetensors b/model-00032-of-00047.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..42384892618af9aca09c7a76b52ca9f1811c4d06 --- /dev/null +++ b/model-00032-of-00047.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be9c3a1a94eb73278eee04f20536984049a19d22cfec99842f130f9a0124b679 +size 2345778256 diff --git a/model-00033-of-00047.safetensors b/model-00033-of-00047.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b75414de57589536fa4b8ecffd6f92d35178f24d --- /dev/null +++ b/model-00033-of-00047.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2fe977ee1930c5371511e72358fe28b6652153c144682f0d0b25985396a2d9f3 +size 2345778256 diff --git a/model-00034-of-00047.safetensors b/model-00034-of-00047.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c6fc06d8a8a3859db19b032fb426c64c24d86c18 --- /dev/null +++ b/model-00034-of-00047.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56e8edad38c7825a51eb2d95e696779b126571861a23570d3c830d5145af88d5 +size 2345778256 diff --git a/model-00035-of-00047.safetensors b/model-00035-of-00047.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6cf27e593213a8cf3c0347a34f1afdc2a83c2e43 --- /dev/null +++ b/model-00035-of-00047.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1987ca16a5051008d42528a6090e0858cca95e96635c17630fc4b42be64fba2b +size 2345778256 diff --git a/model-00036-of-00047.safetensors b/model-00036-of-00047.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6ce26d99d949ad18405cff5e264f93a3dac08a9d --- /dev/null +++ b/model-00036-of-00047.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d96fd512b5e06a9ba547a9075c0c92ed87d48f58bd55e70cd1d36ab370e953d +size 2345778256 diff --git a/model-00037-of-00047.safetensors b/model-00037-of-00047.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..83e1ffdf2830b65647f90375a2ce3510b8ecf86a --- /dev/null +++ b/model-00037-of-00047.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:043d5e8e4fce151634a4bcb8a06a782eacd12cbe10617c4e6dad70036040b6d6 +size 2345778256 diff --git a/model-00038-of-00047.safetensors b/model-00038-of-00047.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..00ea0f9539da2423de46b95b64e457544c698984 --- /dev/null +++ b/model-00038-of-00047.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abd38bbfa42f52515791133a1f613fdb59bfbc7c36eb5494c56367545c025df8 +size 2345778256 diff --git a/model-00039-of-00047.safetensors b/model-00039-of-00047.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..fbefbcb5aa3eb567d7f229a25e9f203e1954ce1e --- /dev/null +++ b/model-00039-of-00047.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9d9984281c5587e6749846705853d14287a6bf13ac4f55cc8eb45db25d85123 +size 2345778256 diff --git a/model-00041-of-00047.safetensors b/model-00041-of-00047.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..04d5920585dd43dd4b8310f8e5bca9597699e4a4 --- /dev/null +++ b/model-00041-of-00047.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc0dbeba62a43bc2bb5420e32c2fbbd0b246f3422210c45338a34567f814e166 +size 2345778256 diff --git a/model-00042-of-00047.safetensors b/model-00042-of-00047.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4ed2dbfa5f98ad6ea3be76da4650e1d9692bc684 --- /dev/null +++ b/model-00042-of-00047.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:140b23ed6313b17d3bb83dfa408489f416e2b4fb69ab213a0fa95cdaa9266022 +size 2345778256 diff --git a/model-00043-of-00047.safetensors b/model-00043-of-00047.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..23732a88a9a46c2e0459f1335b2ca2bc8a565ff2 --- /dev/null +++ b/model-00043-of-00047.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:405cc1ce09cb6f98b93465847c673266b6e2769322929cb7a89a4bad1f23995f +size 2345778256 diff --git a/model-00045-of-00047.safetensors b/model-00045-of-00047.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..64ca43371afe41e6bbe072b74883da3a57964bc5 --- /dev/null +++ b/model-00045-of-00047.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:660f9a5d8ce0fc3c6bb06dadbe7ef096737a56583222f127219185d6636490c9 +size 2345778256 diff --git a/model-00047-of-00047.safetensors b/model-00047-of-00047.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8d1356f8a2e670e6c2ab2b6d56c44d13d1fc5b85 --- /dev/null +++ b/model-00047-of-00047.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e40754924a9ee2229bd1f5ec0a2191a831f6dbf9f9d6f5ef534c6a2a1e8f7cb +size 2412912168 diff --git a/model.safetensors.index.json b/model.safetensors.index.json new file mode 100644 index 0000000000000000000000000000000000000000..0a1d7c74af7900f6fb8ea24c6ee7043f869e04de --- /dev/null +++ b/model.safetensors.index.json @@ -0,0 +1,36330 @@ +{ + "weight_map": { + "model.embed_tokens.weight": "model-00001-of-00047.safetensors", + "model.layers.0.input_layernorm.weight": "model-00001-of-00047.safetensors", + "model.layers.0.mlp.down_proj.weight": "model-00001-of-00047.safetensors", + "model.layers.0.mlp.down_proj.weight_scale": "model-00001-of-00047.safetensors", + "model.layers.0.mlp.gate_proj.weight": "model-00001-of-00047.safetensors", + "model.layers.0.mlp.gate_proj.weight_scale": "model-00001-of-00047.safetensors", + "model.layers.0.mlp.up_proj.weight": "model-00001-of-00047.safetensors", + "model.layers.0.mlp.up_proj.weight_scale": "model-00001-of-00047.safetensors", + "model.layers.0.post_attention_layernorm.weight": "model-00001-of-00047.safetensors", + "model.layers.0.self_attn.k_proj.bias": "model-00001-of-00047.safetensors", + "model.layers.0.self_attn.k_proj.weight": "model-00001-of-00047.safetensors", + "model.layers.0.self_attn.k_proj.weight_scale": "model-00001-of-00047.safetensors", + "model.layers.0.self_attn.o_proj.weight": "model-00001-of-00047.safetensors", + "model.layers.0.self_attn.o_proj.weight_scale": "model-00001-of-00047.safetensors", + "model.layers.0.self_attn.q_proj.bias": "model-00001-of-00047.safetensors", + "model.layers.0.self_attn.q_proj.weight": "model-00001-of-00047.safetensors", + "model.layers.0.self_attn.q_proj.weight_scale": "model-00001-of-00047.safetensors", + "model.layers.0.self_attn.v_proj.bias": "model-00001-of-00047.safetensors", + "model.layers.0.self_attn.v_proj.weight": "model-00001-of-00047.safetensors", + "model.layers.0.self_attn.v_proj.weight_scale": "model-00001-of-00047.safetensors", + "model.layers.46.embed_tokens.weight": "model-00001-of-00047.safetensors", + "model.layers.1.input_layernorm.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.0.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.0.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.0.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.0.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.0.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.0.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.1.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.1.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.1.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.1.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.1.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.1.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.10.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.10.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.10.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.10.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.10.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.10.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.100.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.100.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.100.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.100.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.100.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.100.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.101.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.101.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.101.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.101.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.101.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.101.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.102.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.102.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.102.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.102.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.102.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.102.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.103.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.103.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.103.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.103.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.103.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.103.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.104.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.104.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.104.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.104.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.104.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.104.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.105.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.105.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.105.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.105.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.105.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.105.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.106.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.106.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.106.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.106.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.106.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.106.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.107.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.107.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.107.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.107.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.107.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.107.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.108.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.108.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.108.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.108.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.108.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.108.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.109.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.109.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.109.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.109.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.109.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.109.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.11.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.11.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.11.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.11.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.11.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.11.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.110.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.110.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.110.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.110.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.110.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.110.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.111.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.111.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.111.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.111.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.111.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.111.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.112.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.112.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.112.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.112.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.112.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.112.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.113.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.113.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.113.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.113.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.113.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.113.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.114.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.114.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.114.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.114.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.114.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.114.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.115.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.115.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.115.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.115.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.115.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.115.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.116.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.116.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.116.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.116.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.116.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.116.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.117.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.117.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.117.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.117.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.117.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.117.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.118.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.118.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.118.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.118.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.118.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.118.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.119.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.119.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.119.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.119.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.119.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.119.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.12.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.12.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.12.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.12.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.12.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.12.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.120.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.120.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.120.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.120.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.120.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.120.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.121.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.121.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.121.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.121.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.121.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.121.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.122.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.122.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.122.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.122.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.122.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.122.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.123.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.123.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.123.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.123.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.123.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.123.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.124.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.124.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.124.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.124.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.124.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.124.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.125.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.125.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.125.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.125.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.125.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.125.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.126.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.126.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.126.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.126.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.126.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.126.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.127.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.127.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.127.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.127.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.127.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.127.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.13.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.13.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.13.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.13.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.13.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.13.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.14.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.14.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.14.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.14.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.14.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.14.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.15.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.15.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.15.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.15.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.15.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.15.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.16.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.16.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.16.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.16.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.16.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.16.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.17.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.17.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.17.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.17.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.17.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.17.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.18.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.18.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.18.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.18.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.18.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.18.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.19.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.19.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.19.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.19.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.19.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.19.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.2.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.2.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.2.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.2.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.2.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.2.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.20.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.20.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.20.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.20.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.20.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.20.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.21.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.21.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.21.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.21.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.21.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.21.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.22.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.22.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.22.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.22.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.22.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.22.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.23.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.23.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.23.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.23.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.23.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.23.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.24.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.24.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.24.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.24.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.24.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.24.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.25.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.25.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.25.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.25.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.25.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.25.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.26.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.26.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.26.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.26.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.26.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.26.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.27.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.27.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.27.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.27.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.27.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.27.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.28.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.28.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.28.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.28.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.28.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.28.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.29.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.29.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.29.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.29.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.29.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.29.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.3.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.3.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.3.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.3.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.3.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.3.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.30.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.30.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.30.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.30.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.30.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.30.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.31.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.31.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.31.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.31.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.31.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.31.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.32.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.32.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.32.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.32.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.32.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.32.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.33.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.33.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.33.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.33.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.33.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.33.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.34.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.34.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.34.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.34.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.34.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.34.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.35.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.35.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.35.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.35.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.35.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.35.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.36.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.36.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.36.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.36.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.36.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.36.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.37.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.37.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.37.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.37.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.37.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.37.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.38.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.38.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.38.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.38.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.38.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.38.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.39.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.39.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.39.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.39.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.39.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.39.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.4.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.4.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.4.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.4.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.4.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.4.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.40.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.40.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.40.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.40.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.40.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.40.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.41.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.41.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.41.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.41.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.41.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.41.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.42.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.42.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.42.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.42.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.42.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.42.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.43.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.43.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.43.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.43.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.43.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.43.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.44.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.44.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.44.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.44.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.44.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.44.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.45.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.45.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.45.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.45.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.45.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.45.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.46.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.46.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.46.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.46.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.46.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.46.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.47.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.47.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.47.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.47.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.47.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.47.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.48.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.48.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.48.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.48.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.48.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.48.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.49.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.49.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.49.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.49.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.49.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.49.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.5.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.5.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.5.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.5.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.5.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.5.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.50.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.50.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.50.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.50.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.50.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.50.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.51.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.51.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.51.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.51.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.51.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.51.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.52.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.52.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.52.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.52.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.52.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.52.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.53.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.53.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.53.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.53.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.53.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.53.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.54.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.54.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.54.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.54.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.54.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.54.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.55.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.55.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.55.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.55.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.55.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.55.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.56.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.56.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.56.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.56.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.56.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.56.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.57.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.57.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.57.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.57.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.57.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.57.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.58.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.58.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.58.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.58.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.58.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.58.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.59.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.59.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.59.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.59.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.59.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.59.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.6.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.6.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.6.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.6.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.6.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.6.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.60.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.60.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.60.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.60.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.60.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.60.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.61.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.61.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.61.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.61.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.61.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.61.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.62.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.62.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.62.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.62.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.62.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.62.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.63.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.63.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.63.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.63.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.63.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.63.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.64.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.64.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.64.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.64.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.64.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.64.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.65.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.65.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.65.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.65.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.65.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.65.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.66.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.66.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.66.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.66.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.66.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.66.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.67.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.67.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.67.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.67.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.67.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.67.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.68.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.68.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.68.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.68.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.68.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.68.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.69.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.69.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.69.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.69.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.69.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.69.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.7.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.7.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.7.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.7.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.7.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.7.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.70.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.70.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.70.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.70.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.70.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.70.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.71.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.71.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.71.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.71.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.71.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.71.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.72.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.72.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.72.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.72.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.72.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.72.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.73.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.73.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.73.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.73.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.73.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.73.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.74.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.74.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.74.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.74.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.74.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.74.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.75.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.75.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.75.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.75.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.75.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.75.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.76.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.76.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.76.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.76.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.76.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.76.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.77.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.77.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.77.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.77.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.77.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.77.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.78.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.78.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.78.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.78.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.78.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.78.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.79.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.79.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.79.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.79.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.79.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.79.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.8.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.8.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.8.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.8.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.8.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.8.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.80.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.80.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.80.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.80.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.80.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.80.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.81.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.81.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.81.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.81.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.81.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.81.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.82.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.82.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.82.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.82.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.82.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.82.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.83.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.83.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.83.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.83.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.83.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.83.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.84.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.84.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.84.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.84.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.84.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.84.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.85.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.85.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.85.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.85.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.85.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.85.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.86.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.86.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.86.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.86.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.86.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.86.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.87.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.87.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.87.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.87.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.87.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.87.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.88.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.88.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.88.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.88.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.88.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.88.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.89.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.89.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.89.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.89.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.89.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.89.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.9.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.9.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.9.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.9.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.9.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.9.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.90.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.90.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.90.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.90.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.90.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.90.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.91.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.91.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.91.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.91.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.91.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.91.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.92.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.92.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.92.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.92.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.92.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.92.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.93.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.93.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.93.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.93.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.93.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.93.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.94.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.94.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.94.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.94.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.94.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.94.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.95.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.95.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.95.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.95.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.95.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.95.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.96.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.96.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.96.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.96.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.96.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.96.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.97.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.97.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.97.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.97.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.97.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.97.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.98.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.98.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.98.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.98.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.98.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.98.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.99.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.99.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.99.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.99.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.99.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.experts.99.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.gate.e_score_correction_bias": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.gate.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.shared_experts.down_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.shared_experts.down_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.shared_experts.gate_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.shared_experts.gate_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.shared_experts.up_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.mlp.shared_experts.up_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.post_attention_layernorm.weight": "model-00002-of-00047.safetensors", + "model.layers.1.self_attn.k_proj.bias": "model-00002-of-00047.safetensors", + "model.layers.1.self_attn.k_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.self_attn.k_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.self_attn.o_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.self_attn.o_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.self_attn.q_proj.bias": "model-00002-of-00047.safetensors", + "model.layers.1.self_attn.q_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.self_attn.q_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.1.self_attn.v_proj.bias": "model-00002-of-00047.safetensors", + "model.layers.1.self_attn.v_proj.weight": "model-00002-of-00047.safetensors", + "model.layers.1.self_attn.v_proj.weight_scale": "model-00002-of-00047.safetensors", + "model.layers.2.input_layernorm.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.0.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.0.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.0.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.0.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.0.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.0.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.1.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.1.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.1.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.1.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.1.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.1.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.10.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.10.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.10.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.10.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.10.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.10.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.100.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.100.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.100.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.100.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.100.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.100.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.101.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.101.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.101.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.101.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.101.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.101.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.102.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.102.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.102.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.102.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.102.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.102.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.103.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.103.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.103.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.103.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.103.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.103.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.104.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.104.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.104.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.104.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.104.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.104.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.105.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.105.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.105.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.105.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.105.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.105.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.106.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.106.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.106.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.106.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.106.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.106.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.107.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.107.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.107.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.107.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.107.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.107.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.108.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.108.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.108.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.108.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.108.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.108.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.109.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.109.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.109.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.109.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.109.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.109.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.11.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.11.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.11.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.11.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.11.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.11.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.110.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.110.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.110.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.110.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.110.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.110.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.111.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.111.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.111.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.111.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.111.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.111.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.112.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.112.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.112.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.112.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.112.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.112.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.113.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.113.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.113.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.113.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.113.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.113.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.114.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.114.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.114.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.114.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.114.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.114.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.115.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.115.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.115.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.115.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.115.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.115.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.116.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.116.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.116.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.116.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.116.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.116.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.117.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.117.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.117.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.117.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.117.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.117.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.118.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.118.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.118.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.118.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.118.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.118.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.119.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.119.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.119.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.119.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.119.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.119.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.12.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.12.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.12.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.12.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.12.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.12.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.120.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.120.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.120.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.120.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.120.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.120.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.121.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.121.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.121.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.121.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.121.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.121.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.122.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.122.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.122.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.122.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.122.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.122.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.123.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.123.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.123.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.123.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.123.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.123.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.124.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.124.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.124.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.124.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.124.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.124.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.125.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.125.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.125.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.125.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.125.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.125.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.126.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.126.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.126.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.126.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.126.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.126.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.127.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.127.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.127.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.127.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.127.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.127.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.13.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.13.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.13.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.13.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.13.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.13.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.14.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.14.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.14.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.14.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.14.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.14.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.15.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.15.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.15.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.15.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.15.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.15.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.16.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.16.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.16.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.16.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.16.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.16.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.17.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.17.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.17.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.17.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.17.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.17.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.18.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.18.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.18.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.18.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.18.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.18.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.19.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.19.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.19.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.19.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.19.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.19.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.2.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.2.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.2.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.2.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.2.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.2.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.20.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.20.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.20.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.20.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.20.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.20.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.21.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.21.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.21.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.21.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.21.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.21.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.22.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.22.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.22.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.22.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.22.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.22.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.23.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.23.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.23.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.23.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.23.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.23.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.24.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.24.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.24.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.24.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.24.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.24.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.25.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.25.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.25.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.25.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.25.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.25.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.26.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.26.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.26.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.26.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.26.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.26.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.27.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.27.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.27.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.27.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.27.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.27.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.28.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.28.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.28.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.28.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.28.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.28.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.29.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.29.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.29.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.29.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.29.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.29.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.3.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.3.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.3.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.3.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.3.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.3.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.30.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.30.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.30.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.30.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.30.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.30.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.31.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.31.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.31.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.31.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.31.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.31.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.32.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.32.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.32.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.32.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.32.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.32.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.33.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.33.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.33.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.33.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.33.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.33.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.34.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.34.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.34.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.34.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.34.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.34.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.35.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.35.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.35.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.35.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.35.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.35.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.36.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.36.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.36.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.36.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.36.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.36.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.37.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.37.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.37.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.37.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.37.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.37.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.38.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.38.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.38.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.38.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.38.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.38.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.39.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.39.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.39.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.39.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.39.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.39.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.4.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.4.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.4.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.4.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.4.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.4.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.40.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.40.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.40.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.40.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.40.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.40.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.41.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.41.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.41.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.41.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.41.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.41.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.42.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.42.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.42.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.42.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.42.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.42.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.43.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.43.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.43.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.43.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.43.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.43.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.44.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.44.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.44.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.44.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.44.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.44.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.45.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.45.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.45.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.45.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.45.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.45.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.46.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.46.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.46.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.46.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.46.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.46.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.47.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.47.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.47.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.47.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.47.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.47.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.48.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.48.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.48.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.48.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.48.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.48.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.49.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.49.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.49.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.49.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.49.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.49.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.5.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.5.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.5.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.5.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.5.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.5.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.50.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.50.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.50.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.50.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.50.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.50.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.51.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.51.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.51.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.51.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.51.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.51.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.52.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.52.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.52.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.52.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.52.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.52.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.53.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.53.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.53.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.53.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.53.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.53.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.54.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.54.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.54.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.54.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.54.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.54.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.55.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.55.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.55.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.55.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.55.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.55.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.56.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.56.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.56.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.56.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.56.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.56.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.57.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.57.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.57.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.57.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.57.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.57.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.58.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.58.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.58.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.58.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.58.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.58.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.59.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.59.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.59.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.59.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.59.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.59.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.6.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.6.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.6.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.6.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.6.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.6.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.60.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.60.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.60.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.60.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.60.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.60.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.61.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.61.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.61.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.61.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.61.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.61.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.62.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.62.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.62.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.62.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.62.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.62.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.63.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.63.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.63.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.63.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.63.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.63.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.64.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.64.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.64.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.64.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.64.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.64.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.65.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.65.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.65.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.65.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.65.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.65.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.66.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.66.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.66.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.66.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.66.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.66.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.67.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.67.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.67.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.67.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.67.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.67.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.68.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.68.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.68.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.68.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.68.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.68.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.69.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.69.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.69.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.69.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.69.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.69.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.7.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.7.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.7.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.7.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.7.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.7.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.70.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.70.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.70.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.70.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.70.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.70.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.71.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.71.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.71.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.71.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.71.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.71.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.72.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.72.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.72.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.72.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.72.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.72.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.73.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.73.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.73.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.73.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.73.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.73.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.74.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.74.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.74.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.74.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.74.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.74.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.75.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.75.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.75.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.75.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.75.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.75.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.76.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.76.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.76.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.76.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.76.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.76.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.77.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.77.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.77.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.77.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.77.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.77.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.78.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.78.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.78.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.78.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.78.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.78.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.79.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.79.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.79.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.79.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.79.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.79.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.8.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.8.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.8.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.8.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.8.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.8.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.80.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.80.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.80.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.80.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.80.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.80.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.81.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.81.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.81.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.81.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.81.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.81.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.82.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.82.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.82.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.82.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.82.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.82.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.83.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.83.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.83.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.83.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.83.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.83.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.84.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.84.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.84.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.84.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.84.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.84.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.85.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.85.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.85.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.85.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.85.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.85.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.86.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.86.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.86.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.86.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.86.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.86.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.87.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.87.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.87.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.87.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.87.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.87.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.88.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.88.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.88.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.88.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.88.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.88.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.89.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.89.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.89.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.89.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.89.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.89.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.9.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.9.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.9.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.9.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.9.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.9.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.90.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.90.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.90.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.90.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.90.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.90.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.91.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.91.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.91.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.91.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.91.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.91.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.92.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.92.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.92.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.92.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.92.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.92.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.93.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.93.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.93.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.93.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.93.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.93.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.94.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.94.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.94.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.94.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.94.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.94.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.95.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.95.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.95.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.95.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.95.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.95.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.96.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.96.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.96.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.96.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.96.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.96.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.97.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.97.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.97.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.97.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.97.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.97.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.98.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.98.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.98.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.98.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.98.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.98.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.99.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.99.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.99.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.99.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.99.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.experts.99.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.gate.e_score_correction_bias": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.gate.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.shared_experts.down_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.shared_experts.down_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.shared_experts.gate_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.shared_experts.gate_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.shared_experts.up_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.mlp.shared_experts.up_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.post_attention_layernorm.weight": "model-00003-of-00047.safetensors", + "model.layers.2.self_attn.k_proj.bias": "model-00003-of-00047.safetensors", + "model.layers.2.self_attn.k_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.self_attn.k_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.self_attn.o_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.self_attn.o_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.self_attn.q_proj.bias": "model-00003-of-00047.safetensors", + "model.layers.2.self_attn.q_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.self_attn.q_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.2.self_attn.v_proj.bias": "model-00003-of-00047.safetensors", + "model.layers.2.self_attn.v_proj.weight": "model-00003-of-00047.safetensors", + "model.layers.2.self_attn.v_proj.weight_scale": "model-00003-of-00047.safetensors", + "model.layers.3.input_layernorm.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.0.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.0.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.0.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.0.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.0.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.0.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.1.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.1.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.1.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.1.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.1.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.1.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.10.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.10.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.10.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.10.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.10.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.10.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.100.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.100.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.100.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.100.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.100.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.100.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.101.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.101.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.101.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.101.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.101.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.101.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.102.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.102.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.102.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.102.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.102.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.102.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.103.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.103.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.103.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.103.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.103.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.103.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.104.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.104.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.104.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.104.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.104.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.104.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.105.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.105.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.105.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.105.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.105.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.105.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.106.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.106.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.106.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.106.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.106.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.106.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.107.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.107.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.107.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.107.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.107.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.107.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.108.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.108.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.108.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.108.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.108.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.108.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.109.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.109.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.109.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.109.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.109.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.109.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.11.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.11.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.11.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.11.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.11.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.11.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.110.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.110.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.110.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.110.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.110.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.110.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.111.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.111.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.111.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.111.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.111.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.111.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.112.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.112.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.112.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.112.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.112.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.112.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.113.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.113.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.113.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.113.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.113.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.113.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.114.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.114.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.114.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.114.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.114.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.114.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.115.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.115.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.115.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.115.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.115.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.115.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.116.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.116.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.116.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.116.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.116.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.116.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.117.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.117.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.117.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.117.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.117.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.117.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.118.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.118.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.118.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.118.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.118.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.118.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.119.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.119.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.119.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.119.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.119.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.119.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.12.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.12.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.12.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.12.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.12.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.12.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.120.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.120.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.120.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.120.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.120.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.120.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.121.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.121.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.121.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.121.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.121.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.121.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.122.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.122.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.122.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.122.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.122.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.122.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.123.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.123.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.123.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.123.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.123.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.123.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.124.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.124.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.124.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.124.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.124.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.124.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.125.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.125.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.125.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.125.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.125.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.125.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.126.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.126.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.126.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.126.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.126.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.126.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.127.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.127.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.127.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.127.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.127.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.127.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.13.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.13.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.13.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.13.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.13.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.13.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.14.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.14.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.14.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.14.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.14.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.14.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.15.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.15.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.15.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.15.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.15.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.15.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.16.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.16.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.16.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.16.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.16.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.16.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.17.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.17.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.17.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.17.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.17.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.17.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.18.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.18.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.18.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.18.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.18.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.18.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.19.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.19.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.19.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.19.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.19.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.19.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.2.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.2.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.2.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.2.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.2.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.2.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.20.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.20.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.20.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.20.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.20.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.20.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.21.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.21.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.21.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.21.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.21.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.21.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.22.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.22.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.22.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.22.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.22.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.22.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.23.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.23.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.23.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.23.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.23.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.23.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.24.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.24.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.24.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.24.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.24.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.24.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.25.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.25.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.25.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.25.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.25.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.25.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.26.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.26.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.26.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.26.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.26.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.26.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.27.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.27.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.27.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.27.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.27.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.27.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.28.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.28.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.28.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.28.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.28.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.28.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.29.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.29.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.29.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.29.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.29.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.29.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.3.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.3.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.3.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.3.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.3.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.3.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.30.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.30.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.30.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.30.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.30.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.30.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.31.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.31.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.31.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.31.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.31.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.31.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.32.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.32.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.32.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.32.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.32.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.32.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.33.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.33.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.33.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.33.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.33.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.33.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.34.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.34.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.34.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.34.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.34.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.34.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.35.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.35.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.35.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.35.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.35.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.35.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.36.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.36.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.36.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.36.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.36.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.36.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.37.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.37.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.37.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.37.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.37.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.37.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.38.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.38.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.38.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.38.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.38.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.38.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.39.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.39.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.39.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.39.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.39.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.39.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.4.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.4.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.4.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.4.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.4.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.4.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.40.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.40.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.40.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.40.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.40.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.40.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.41.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.41.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.41.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.41.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.41.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.41.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.42.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.42.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.42.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.42.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.42.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.42.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.43.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.43.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.43.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.43.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.43.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.43.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.44.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.44.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.44.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.44.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.44.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.44.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.45.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.45.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.45.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.45.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.45.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.45.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.46.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.46.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.46.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.46.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.46.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.46.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.47.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.47.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.47.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.47.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.47.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.47.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.48.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.48.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.48.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.48.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.48.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.48.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.49.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.49.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.49.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.49.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.49.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.49.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.5.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.5.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.5.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.5.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.5.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.5.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.50.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.50.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.50.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.50.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.50.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.50.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.51.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.51.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.51.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.51.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.51.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.51.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.52.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.52.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.52.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.52.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.52.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.52.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.53.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.53.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.53.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.53.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.53.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.53.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.54.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.54.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.54.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.54.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.54.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.54.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.55.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.55.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.55.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.55.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.55.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.55.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.56.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.56.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.56.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.56.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.56.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.56.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.57.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.57.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.57.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.57.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.57.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.57.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.58.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.58.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.58.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.58.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.58.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.58.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.59.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.59.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.59.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.59.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.59.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.59.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.6.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.6.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.6.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.6.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.6.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.6.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.60.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.60.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.60.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.60.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.60.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.60.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.61.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.61.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.61.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.61.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.61.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.61.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.62.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.62.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.62.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.62.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.62.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.62.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.63.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.63.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.63.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.63.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.63.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.63.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.64.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.64.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.64.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.64.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.64.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.64.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.65.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.65.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.65.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.65.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.65.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.65.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.66.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.66.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.66.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.66.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.66.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.66.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.67.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.67.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.67.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.67.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.67.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.67.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.68.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.68.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.68.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.68.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.68.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.68.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.69.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.69.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.69.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.69.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.69.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.69.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.7.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.7.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.7.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.7.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.7.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.7.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.70.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.70.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.70.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.70.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.70.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.70.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.71.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.71.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.71.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.71.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.71.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.71.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.72.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.72.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.72.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.72.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.72.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.72.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.73.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.73.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.73.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.73.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.73.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.73.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.74.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.74.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.74.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.74.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.74.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.74.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.75.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.75.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.75.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.75.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.75.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.75.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.76.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.76.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.76.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.76.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.76.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.76.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.77.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.77.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.77.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.77.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.77.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.77.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.78.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.78.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.78.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.78.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.78.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.78.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.79.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.79.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.79.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.79.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.79.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.79.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.8.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.8.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.8.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.8.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.8.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.8.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.80.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.80.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.80.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.80.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.80.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.80.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.81.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.81.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.81.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.81.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.81.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.81.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.82.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.82.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.82.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.82.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.82.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.82.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.83.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.83.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.83.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.83.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.83.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.83.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.84.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.84.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.84.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.84.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.84.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.84.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.85.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.85.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.85.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.85.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.85.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.85.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.86.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.86.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.86.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.86.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.86.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.86.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.87.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.87.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.87.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.87.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.87.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.87.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.88.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.88.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.88.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.88.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.88.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.88.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.89.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.89.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.89.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.89.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.89.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.89.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.9.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.9.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.9.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.9.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.9.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.9.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.90.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.90.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.90.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.90.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.90.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.90.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.91.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.91.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.91.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.91.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.91.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.91.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.92.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.92.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.92.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.92.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.92.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.92.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.93.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.93.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.93.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.93.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.93.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.93.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.94.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.94.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.94.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.94.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.94.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.94.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.95.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.95.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.95.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.95.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.95.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.95.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.96.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.96.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.96.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.96.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.96.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.96.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.97.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.97.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.97.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.97.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.97.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.97.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.98.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.98.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.98.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.98.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.98.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.98.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.99.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.99.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.99.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.99.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.99.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.experts.99.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.gate.e_score_correction_bias": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.gate.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.shared_experts.down_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.shared_experts.down_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.shared_experts.gate_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.shared_experts.gate_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.shared_experts.up_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.mlp.shared_experts.up_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.post_attention_layernorm.weight": "model-00004-of-00047.safetensors", + "model.layers.3.self_attn.k_proj.bias": "model-00004-of-00047.safetensors", + "model.layers.3.self_attn.k_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.self_attn.k_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.self_attn.o_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.self_attn.o_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.self_attn.q_proj.bias": "model-00004-of-00047.safetensors", + "model.layers.3.self_attn.q_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.self_attn.q_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.3.self_attn.v_proj.bias": "model-00004-of-00047.safetensors", + "model.layers.3.self_attn.v_proj.weight": "model-00004-of-00047.safetensors", + "model.layers.3.self_attn.v_proj.weight_scale": "model-00004-of-00047.safetensors", + "model.layers.4.input_layernorm.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.0.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.0.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.0.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.0.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.0.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.0.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.1.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.1.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.1.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.1.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.1.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.1.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.10.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.10.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.10.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.10.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.10.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.10.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.100.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.100.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.100.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.100.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.100.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.100.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.101.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.101.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.101.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.101.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.101.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.101.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.102.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.102.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.102.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.102.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.102.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.102.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.103.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.103.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.103.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.103.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.103.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.103.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.104.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.104.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.104.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.104.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.104.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.104.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.105.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.105.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.105.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.105.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.105.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.105.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.106.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.106.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.106.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.106.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.106.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.106.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.107.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.107.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.107.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.107.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.107.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.107.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.108.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.108.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.108.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.108.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.108.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.108.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.109.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.109.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.109.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.109.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.109.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.109.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.11.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.11.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.11.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.11.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.11.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.11.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.110.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.110.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.110.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.110.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.110.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.110.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.111.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.111.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.111.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.111.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.111.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.111.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.112.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.112.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.112.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.112.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.112.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.112.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.113.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.113.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.113.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.113.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.113.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.113.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.114.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.114.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.114.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.114.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.114.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.114.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.115.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.115.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.115.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.115.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.115.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.115.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.116.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.116.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.116.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.116.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.116.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.116.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.117.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.117.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.117.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.117.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.117.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.117.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.118.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.118.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.118.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.118.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.118.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.118.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.119.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.119.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.119.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.119.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.119.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.119.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.12.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.12.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.12.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.12.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.12.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.12.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.120.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.120.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.120.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.120.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.120.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.120.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.121.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.121.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.121.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.121.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.121.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.121.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.122.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.122.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.122.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.122.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.122.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.122.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.123.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.123.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.123.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.123.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.123.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.123.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.124.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.124.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.124.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.124.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.124.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.124.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.125.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.125.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.125.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.125.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.125.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.125.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.126.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.126.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.126.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.126.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.126.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.126.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.127.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.127.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.127.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.127.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.127.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.127.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.13.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.13.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.13.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.13.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.13.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.13.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.14.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.14.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.14.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.14.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.14.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.14.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.15.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.15.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.15.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.15.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.15.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.15.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.16.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.16.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.16.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.16.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.16.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.16.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.17.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.17.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.17.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.17.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.17.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.17.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.18.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.18.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.18.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.18.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.18.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.18.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.19.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.19.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.19.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.19.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.19.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.19.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.2.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.2.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.2.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.2.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.2.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.2.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.20.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.20.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.20.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.20.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.20.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.20.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.21.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.21.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.21.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.21.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.21.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.21.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.22.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.22.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.22.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.22.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.22.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.22.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.23.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.23.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.23.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.23.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.23.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.23.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.24.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.24.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.24.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.24.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.24.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.24.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.25.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.25.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.25.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.25.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.25.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.25.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.26.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.26.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.26.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.26.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.26.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.26.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.27.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.27.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.27.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.27.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.27.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.27.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.28.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.28.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.28.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.28.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.28.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.28.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.29.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.29.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.29.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.29.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.29.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.29.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.3.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.3.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.3.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.3.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.3.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.3.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.30.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.30.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.30.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.30.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.30.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.30.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.31.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.31.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.31.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.31.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.31.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.31.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.32.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.32.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.32.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.32.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.32.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.32.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.33.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.33.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.33.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.33.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.33.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.33.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.34.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.34.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.34.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.34.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.34.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.34.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.35.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.35.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.35.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.35.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.35.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.35.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.36.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.36.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.36.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.36.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.36.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.36.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.37.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.37.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.37.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.37.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.37.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.37.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.38.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.38.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.38.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.38.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.38.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.38.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.39.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.39.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.39.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.39.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.39.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.39.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.4.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.4.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.4.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.4.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.4.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.4.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.40.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.40.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.40.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.40.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.40.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.40.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.41.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.41.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.41.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.41.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.41.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.41.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.42.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.42.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.42.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.42.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.42.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.42.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.43.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.43.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.43.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.43.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.43.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.43.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.44.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.44.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.44.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.44.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.44.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.44.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.45.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.45.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.45.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.45.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.45.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.45.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.46.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.46.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.46.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.46.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.46.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.46.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.47.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.47.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.47.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.47.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.47.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.47.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.48.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.48.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.48.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.48.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.48.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.48.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.49.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.49.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.49.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.49.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.49.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.49.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.5.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.5.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.5.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.5.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.5.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.5.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.50.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.50.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.50.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.50.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.50.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.50.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.51.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.51.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.51.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.51.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.51.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.51.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.52.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.52.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.52.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.52.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.52.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.52.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.53.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.53.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.53.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.53.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.53.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.53.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.54.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.54.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.54.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.54.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.54.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.54.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.55.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.55.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.55.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.55.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.55.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.55.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.56.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.56.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.56.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.56.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.56.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.56.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.57.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.57.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.57.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.57.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.57.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.57.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.58.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.58.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.58.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.58.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.58.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.58.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.59.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.59.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.59.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.59.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.59.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.59.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.6.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.6.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.6.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.6.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.6.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.6.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.60.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.60.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.60.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.60.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.60.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.60.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.61.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.61.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.61.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.61.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.61.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.61.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.62.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.62.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.62.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.62.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.62.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.62.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.63.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.63.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.63.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.63.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.63.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.63.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.64.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.64.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.64.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.64.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.64.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.64.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.65.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.65.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.65.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.65.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.65.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.65.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.66.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.66.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.66.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.66.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.66.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.66.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.67.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.67.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.67.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.67.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.67.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.67.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.68.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.68.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.68.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.68.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.68.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.68.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.69.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.69.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.69.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.69.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.69.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.69.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.7.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.7.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.7.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.7.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.7.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.7.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.70.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.70.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.70.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.70.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.70.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.70.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.71.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.71.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.71.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.71.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.71.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.71.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.72.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.72.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.72.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.72.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.72.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.72.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.73.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.73.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.73.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.73.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.73.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.73.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.74.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.74.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.74.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.74.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.74.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.74.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.75.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.75.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.75.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.75.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.75.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.75.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.76.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.76.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.76.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.76.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.76.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.76.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.77.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.77.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.77.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.77.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.77.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.77.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.78.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.78.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.78.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.78.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.78.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.78.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.79.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.79.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.79.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.79.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.79.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.79.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.8.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.8.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.8.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.8.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.8.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.8.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.80.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.80.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.80.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.80.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.80.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.80.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.81.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.81.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.81.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.81.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.81.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.81.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.82.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.82.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.82.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.82.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.82.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.82.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.83.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.83.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.83.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.83.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.83.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.83.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.84.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.84.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.84.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.84.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.84.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.84.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.85.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.85.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.85.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.85.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.85.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.85.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.86.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.86.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.86.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.86.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.86.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.86.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.87.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.87.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.87.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.87.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.87.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.87.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.88.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.88.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.88.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.88.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.88.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.88.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.89.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.89.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.89.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.89.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.89.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.89.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.9.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.9.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.9.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.9.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.9.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.9.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.90.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.90.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.90.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.90.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.90.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.90.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.91.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.91.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.91.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.91.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.91.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.91.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.92.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.92.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.92.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.92.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.92.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.92.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.93.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.93.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.93.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.93.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.93.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.93.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.94.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.94.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.94.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.94.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.94.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.94.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.95.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.95.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.95.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.95.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.95.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.95.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.96.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.96.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.96.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.96.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.96.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.96.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.97.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.97.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.97.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.97.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.97.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.97.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.98.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.98.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.98.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.98.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.98.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.98.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.99.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.99.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.99.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.99.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.99.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.experts.99.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.gate.e_score_correction_bias": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.gate.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.shared_experts.down_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.shared_experts.down_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.shared_experts.gate_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.shared_experts.gate_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.shared_experts.up_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.mlp.shared_experts.up_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.post_attention_layernorm.weight": "model-00005-of-00047.safetensors", + "model.layers.4.self_attn.k_proj.bias": "model-00005-of-00047.safetensors", + "model.layers.4.self_attn.k_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.self_attn.k_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.self_attn.o_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.self_attn.o_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.self_attn.q_proj.bias": "model-00005-of-00047.safetensors", + "model.layers.4.self_attn.q_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.self_attn.q_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.4.self_attn.v_proj.bias": "model-00005-of-00047.safetensors", + "model.layers.4.self_attn.v_proj.weight": "model-00005-of-00047.safetensors", + "model.layers.4.self_attn.v_proj.weight_scale": "model-00005-of-00047.safetensors", + "model.layers.5.input_layernorm.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.0.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.0.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.0.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.0.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.0.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.0.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.1.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.1.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.1.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.1.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.1.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.1.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.10.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.10.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.10.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.10.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.10.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.10.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.100.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.100.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.100.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.100.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.100.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.100.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.101.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.101.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.101.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.101.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.101.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.101.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.102.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.102.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.102.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.102.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.102.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.102.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.103.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.103.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.103.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.103.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.103.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.103.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.104.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.104.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.104.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.104.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.104.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.104.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.105.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.105.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.105.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.105.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.105.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.105.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.106.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.106.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.106.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.106.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.106.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.106.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.107.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.107.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.107.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.107.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.107.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.107.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.108.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.108.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.108.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.108.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.108.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.108.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.109.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.109.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.109.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.109.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.109.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.109.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.11.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.11.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.11.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.11.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.11.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.11.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.110.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.110.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.110.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.110.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.110.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.110.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.111.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.111.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.111.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.111.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.111.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.111.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.112.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.112.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.112.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.112.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.112.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.112.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.113.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.113.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.113.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.113.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.113.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.113.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.114.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.114.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.114.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.114.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.114.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.114.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.115.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.115.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.115.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.115.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.115.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.115.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.116.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.116.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.116.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.116.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.116.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.116.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.117.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.117.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.117.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.117.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.117.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.117.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.118.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.118.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.118.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.118.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.118.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.118.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.119.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.119.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.119.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.119.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.119.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.119.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.12.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.12.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.12.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.12.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.12.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.12.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.120.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.120.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.120.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.120.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.120.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.120.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.121.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.121.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.121.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.121.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.121.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.121.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.122.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.122.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.122.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.122.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.122.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.122.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.123.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.123.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.123.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.123.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.123.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.123.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.124.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.124.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.124.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.124.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.124.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.124.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.125.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.125.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.125.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.125.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.125.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.125.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.126.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.126.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.126.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.126.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.126.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.126.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.127.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.127.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.127.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.127.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.127.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.127.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.13.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.13.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.13.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.13.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.13.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.13.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.14.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.14.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.14.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.14.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.14.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.14.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.15.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.15.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.15.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.15.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.15.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.15.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.16.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.16.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.16.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.16.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.16.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.16.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.17.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.17.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.17.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.17.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.17.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.17.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.18.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.18.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.18.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.18.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.18.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.18.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.19.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.19.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.19.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.19.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.19.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.19.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.2.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.2.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.2.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.2.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.2.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.2.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.20.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.20.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.20.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.20.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.20.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.20.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.21.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.21.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.21.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.21.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.21.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.21.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.22.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.22.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.22.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.22.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.22.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.22.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.23.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.23.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.23.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.23.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.23.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.23.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.24.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.24.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.24.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.24.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.24.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.24.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.25.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.25.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.25.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.25.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.25.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.25.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.26.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.26.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.26.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.26.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.26.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.26.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.27.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.27.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.27.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.27.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.27.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.27.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.28.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.28.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.28.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.28.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.28.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.28.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.29.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.29.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.29.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.29.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.29.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.29.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.3.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.3.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.3.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.3.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.3.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.3.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.30.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.30.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.30.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.30.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.30.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.30.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.31.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.31.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.31.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.31.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.31.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.31.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.32.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.32.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.32.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.32.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.32.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.32.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.33.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.33.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.33.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.33.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.33.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.33.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.34.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.34.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.34.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.34.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.34.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.34.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.35.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.35.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.35.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.35.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.35.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.35.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.36.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.36.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.36.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.36.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.36.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.36.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.37.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.37.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.37.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.37.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.37.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.37.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.38.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.38.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.38.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.38.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.38.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.38.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.39.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.39.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.39.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.39.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.39.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.39.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.4.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.4.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.4.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.4.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.4.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.4.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.40.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.40.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.40.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.40.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.40.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.40.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.41.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.41.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.41.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.41.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.41.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.41.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.42.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.42.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.42.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.42.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.42.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.42.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.43.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.43.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.43.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.43.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.43.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.43.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.44.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.44.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.44.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.44.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.44.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.44.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.45.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.45.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.45.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.45.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.45.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.45.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.46.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.46.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.46.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.46.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.46.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.46.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.47.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.47.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.47.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.47.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.47.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.47.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.48.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.48.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.48.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.48.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.48.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.48.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.49.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.49.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.49.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.49.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.49.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.49.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.5.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.5.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.5.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.5.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.5.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.5.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.50.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.50.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.50.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.50.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.50.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.50.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.51.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.51.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.51.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.51.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.51.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.51.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.52.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.52.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.52.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.52.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.52.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.52.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.53.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.53.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.53.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.53.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.53.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.53.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.54.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.54.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.54.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.54.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.54.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.54.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.55.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.55.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.55.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.55.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.55.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.55.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.56.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.56.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.56.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.56.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.56.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.56.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.57.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.57.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.57.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.57.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.57.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.57.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.58.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.58.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.58.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.58.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.58.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.58.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.59.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.59.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.59.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.59.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.59.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.59.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.6.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.6.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.6.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.6.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.6.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.6.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.60.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.60.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.60.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.60.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.60.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.60.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.61.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.61.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.61.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.61.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.61.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.61.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.62.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.62.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.62.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.62.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.62.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.62.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.63.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.63.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.63.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.63.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.63.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.63.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.64.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.64.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.64.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.64.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.64.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.64.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.65.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.65.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.65.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.65.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.65.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.65.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.66.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.66.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.66.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.66.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.66.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.66.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.67.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.67.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.67.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.67.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.67.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.67.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.68.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.68.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.68.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.68.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.68.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.68.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.69.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.69.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.69.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.69.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.69.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.69.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.7.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.7.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.7.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.7.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.7.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.7.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.70.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.70.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.70.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.70.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.70.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.70.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.71.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.71.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.71.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.71.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.71.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.71.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.72.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.72.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.72.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.72.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.72.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.72.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.73.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.73.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.73.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.73.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.73.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.73.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.74.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.74.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.74.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.74.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.74.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.74.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.75.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.75.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.75.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.75.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.75.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.75.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.76.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.76.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.76.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.76.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.76.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.76.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.77.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.77.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.77.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.77.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.77.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.77.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.78.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.78.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.78.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.78.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.78.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.78.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.79.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.79.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.79.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.79.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.79.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.79.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.8.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.8.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.8.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.8.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.8.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.8.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.80.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.80.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.80.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.80.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.80.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.80.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.81.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.81.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.81.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.81.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.81.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.81.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.82.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.82.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.82.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.82.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.82.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.82.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.83.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.83.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.83.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.83.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.83.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.83.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.84.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.84.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.84.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.84.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.84.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.84.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.85.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.85.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.85.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.85.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.85.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.85.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.86.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.86.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.86.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.86.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.86.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.86.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.87.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.87.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.87.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.87.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.87.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.87.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.88.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.88.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.88.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.88.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.88.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.88.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.89.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.89.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.89.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.89.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.89.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.89.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.9.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.9.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.9.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.9.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.9.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.9.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.90.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.90.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.90.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.90.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.90.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.90.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.91.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.91.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.91.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.91.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.91.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.91.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.92.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.92.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.92.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.92.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.92.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.92.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.93.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.93.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.93.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.93.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.93.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.93.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.94.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.94.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.94.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.94.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.94.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.94.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.95.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.95.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.95.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.95.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.95.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.95.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.96.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.96.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.96.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.96.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.96.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.96.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.97.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.97.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.97.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.97.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.97.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.97.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.98.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.98.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.98.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.98.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.98.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.98.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.99.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.99.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.99.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.99.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.99.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.experts.99.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.gate.e_score_correction_bias": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.gate.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.shared_experts.down_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.shared_experts.down_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.shared_experts.gate_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.shared_experts.gate_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.shared_experts.up_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.mlp.shared_experts.up_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.post_attention_layernorm.weight": "model-00006-of-00047.safetensors", + "model.layers.5.self_attn.k_proj.bias": "model-00006-of-00047.safetensors", + "model.layers.5.self_attn.k_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.self_attn.k_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.self_attn.o_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.self_attn.o_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.self_attn.q_proj.bias": "model-00006-of-00047.safetensors", + "model.layers.5.self_attn.q_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.self_attn.q_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.5.self_attn.v_proj.bias": "model-00006-of-00047.safetensors", + "model.layers.5.self_attn.v_proj.weight": "model-00006-of-00047.safetensors", + "model.layers.5.self_attn.v_proj.weight_scale": "model-00006-of-00047.safetensors", + "model.layers.6.input_layernorm.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.0.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.0.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.0.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.0.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.0.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.0.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.1.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.1.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.1.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.1.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.1.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.1.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.10.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.10.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.10.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.10.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.10.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.10.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.100.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.100.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.100.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.100.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.100.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.100.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.101.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.101.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.101.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.101.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.101.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.101.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.102.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.102.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.102.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.102.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.102.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.102.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.103.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.103.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.103.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.103.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.103.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.103.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.104.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.104.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.104.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.104.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.104.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.104.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.105.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.105.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.105.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.105.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.105.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.105.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.106.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.106.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.106.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.106.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.106.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.106.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.107.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.107.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.107.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.107.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.107.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.107.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.108.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.108.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.108.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.108.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.108.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.108.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.109.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.109.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.109.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.109.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.109.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.109.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.11.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.11.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.11.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.11.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.11.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.11.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.110.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.110.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.110.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.110.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.110.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.110.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.111.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.111.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.111.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.111.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.111.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.111.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.112.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.112.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.112.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.112.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.112.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.112.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.113.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.113.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.113.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.113.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.113.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.113.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.114.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.114.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.114.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.114.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.114.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.114.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.115.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.115.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.115.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.115.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.115.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.115.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.116.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.116.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.116.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.116.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.116.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.116.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.117.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.117.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.117.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.117.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.117.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.117.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.118.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.118.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.118.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.118.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.118.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.118.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.119.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.119.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.119.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.119.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.119.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.119.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.12.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.12.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.12.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.12.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.12.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.12.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.120.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.120.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.120.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.120.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.120.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.120.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.121.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.121.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.121.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.121.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.121.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.121.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.122.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.122.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.122.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.122.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.122.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.122.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.123.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.123.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.123.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.123.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.123.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.123.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.124.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.124.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.124.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.124.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.124.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.124.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.125.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.125.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.125.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.125.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.125.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.125.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.126.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.126.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.126.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.126.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.126.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.126.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.127.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.127.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.127.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.127.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.127.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.127.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.13.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.13.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.13.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.13.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.13.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.13.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.14.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.14.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.14.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.14.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.14.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.14.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.15.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.15.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.15.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.15.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.15.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.15.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.16.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.16.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.16.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.16.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.16.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.16.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.17.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.17.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.17.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.17.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.17.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.17.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.18.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.18.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.18.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.18.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.18.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.18.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.19.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.19.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.19.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.19.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.19.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.19.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.2.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.2.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.2.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.2.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.2.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.2.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.20.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.20.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.20.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.20.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.20.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.20.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.21.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.21.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.21.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.21.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.21.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.21.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.22.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.22.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.22.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.22.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.22.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.22.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.23.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.23.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.23.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.23.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.23.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.23.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.24.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.24.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.24.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.24.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.24.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.24.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.25.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.25.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.25.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.25.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.25.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.25.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.26.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.26.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.26.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.26.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.26.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.26.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.27.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.27.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.27.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.27.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.27.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.27.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.28.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.28.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.28.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.28.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.28.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.28.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.29.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.29.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.29.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.29.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.29.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.29.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.3.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.3.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.3.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.3.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.3.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.3.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.30.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.30.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.30.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.30.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.30.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.30.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.31.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.31.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.31.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.31.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.31.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.31.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.32.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.32.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.32.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.32.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.32.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.32.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.33.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.33.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.33.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.33.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.33.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.33.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.34.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.34.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.34.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.34.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.34.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.34.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.35.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.35.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.35.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.35.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.35.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.35.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.36.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.36.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.36.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.36.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.36.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.36.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.37.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.37.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.37.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.37.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.37.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.37.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.38.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.38.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.38.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.38.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.38.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.38.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.39.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.39.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.39.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.39.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.39.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.39.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.4.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.4.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.4.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.4.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.4.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.4.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.40.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.40.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.40.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.40.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.40.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.40.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.41.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.41.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.41.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.41.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.41.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.41.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.42.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.42.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.42.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.42.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.42.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.42.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.43.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.43.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.43.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.43.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.43.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.43.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.44.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.44.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.44.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.44.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.44.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.44.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.45.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.45.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.45.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.45.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.45.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.45.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.46.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.46.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.46.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.46.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.46.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.46.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.47.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.47.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.47.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.47.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.47.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.47.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.48.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.48.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.48.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.48.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.48.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.48.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.49.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.49.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.49.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.49.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.49.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.49.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.5.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.5.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.5.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.5.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.5.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.5.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.50.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.50.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.50.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.50.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.50.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.50.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.51.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.51.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.51.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.51.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.51.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.51.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.52.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.52.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.52.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.52.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.52.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.52.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.53.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.53.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.53.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.53.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.53.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.53.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.54.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.54.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.54.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.54.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.54.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.54.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.55.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.55.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.55.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.55.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.55.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.55.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.56.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.56.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.56.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.56.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.56.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.56.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.57.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.57.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.57.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.57.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.57.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.57.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.58.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.58.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.58.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.58.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.58.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.58.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.59.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.59.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.59.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.59.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.59.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.59.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.6.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.6.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.6.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.6.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.6.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.6.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.60.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.60.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.60.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.60.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.60.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.60.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.61.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.61.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.61.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.61.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.61.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.61.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.62.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.62.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.62.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.62.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.62.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.62.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.63.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.63.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.63.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.63.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.63.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.63.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.64.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.64.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.64.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.64.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.64.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.64.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.65.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.65.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.65.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.65.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.65.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.65.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.66.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.66.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.66.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.66.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.66.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.66.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.67.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.67.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.67.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.67.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.67.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.67.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.68.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.68.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.68.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.68.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.68.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.68.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.69.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.69.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.69.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.69.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.69.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.69.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.7.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.7.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.7.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.7.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.7.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.7.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.70.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.70.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.70.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.70.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.70.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.70.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.71.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.71.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.71.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.71.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.71.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.71.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.72.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.72.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.72.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.72.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.72.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.72.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.73.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.73.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.73.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.73.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.73.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.73.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.74.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.74.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.74.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.74.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.74.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.74.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.75.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.75.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.75.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.75.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.75.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.75.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.76.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.76.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.76.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.76.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.76.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.76.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.77.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.77.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.77.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.77.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.77.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.77.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.78.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.78.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.78.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.78.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.78.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.78.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.79.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.79.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.79.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.79.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.79.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.79.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.8.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.8.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.8.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.8.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.8.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.8.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.80.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.80.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.80.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.80.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.80.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.80.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.81.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.81.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.81.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.81.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.81.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.81.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.82.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.82.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.82.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.82.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.82.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.82.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.83.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.83.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.83.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.83.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.83.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.83.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.84.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.84.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.84.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.84.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.84.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.84.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.85.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.85.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.85.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.85.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.85.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.85.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.86.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.86.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.86.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.86.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.86.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.86.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.87.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.87.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.87.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.87.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.87.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.87.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.88.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.88.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.88.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.88.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.88.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.88.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.89.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.89.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.89.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.89.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.89.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.89.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.9.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.9.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.9.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.9.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.9.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.9.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.90.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.90.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.90.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.90.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.90.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.90.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.91.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.91.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.91.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.91.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.91.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.91.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.92.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.92.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.92.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.92.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.92.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.92.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.93.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.93.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.93.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.93.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.93.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.93.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.94.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.94.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.94.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.94.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.94.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.94.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.95.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.95.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.95.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.95.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.95.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.95.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.96.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.96.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.96.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.96.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.96.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.96.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.97.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.97.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.97.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.97.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.97.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.97.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.98.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.98.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.98.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.98.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.98.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.98.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.99.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.99.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.99.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.99.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.99.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.experts.99.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.gate.e_score_correction_bias": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.gate.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.shared_experts.down_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.shared_experts.down_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.shared_experts.gate_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.shared_experts.gate_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.shared_experts.up_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.mlp.shared_experts.up_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.post_attention_layernorm.weight": "model-00007-of-00047.safetensors", + "model.layers.6.self_attn.k_proj.bias": "model-00007-of-00047.safetensors", + "model.layers.6.self_attn.k_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.self_attn.k_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.self_attn.o_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.self_attn.o_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.self_attn.q_proj.bias": "model-00007-of-00047.safetensors", + "model.layers.6.self_attn.q_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.self_attn.q_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.6.self_attn.v_proj.bias": "model-00007-of-00047.safetensors", + "model.layers.6.self_attn.v_proj.weight": "model-00007-of-00047.safetensors", + "model.layers.6.self_attn.v_proj.weight_scale": "model-00007-of-00047.safetensors", + "model.layers.7.input_layernorm.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.0.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.0.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.0.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.0.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.0.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.0.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.1.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.1.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.1.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.1.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.1.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.1.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.10.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.10.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.10.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.10.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.10.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.10.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.100.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.100.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.100.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.100.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.100.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.100.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.101.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.101.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.101.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.101.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.101.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.101.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.102.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.102.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.102.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.102.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.102.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.102.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.103.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.103.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.103.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.103.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.103.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.103.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.104.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.104.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.104.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.104.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.104.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.104.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.105.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.105.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.105.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.105.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.105.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.105.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.106.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.106.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.106.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.106.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.106.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.106.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.107.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.107.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.107.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.107.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.107.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.107.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.108.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.108.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.108.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.108.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.108.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.108.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.109.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.109.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.109.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.109.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.109.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.109.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.11.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.11.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.11.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.11.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.11.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.11.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.110.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.110.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.110.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.110.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.110.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.110.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.111.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.111.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.111.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.111.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.111.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.111.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.112.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.112.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.112.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.112.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.112.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.112.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.113.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.113.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.113.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.113.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.113.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.113.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.114.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.114.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.114.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.114.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.114.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.114.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.115.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.115.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.115.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.115.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.115.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.115.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.116.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.116.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.116.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.116.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.116.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.116.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.117.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.117.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.117.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.117.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.117.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.117.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.118.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.118.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.118.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.118.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.118.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.118.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.119.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.119.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.119.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.119.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.119.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.119.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.12.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.12.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.12.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.12.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.12.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.12.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.120.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.120.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.120.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.120.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.120.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.120.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.121.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.121.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.121.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.121.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.121.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.121.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.122.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.122.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.122.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.122.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.122.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.122.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.123.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.123.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.123.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.123.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.123.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.123.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.124.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.124.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.124.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.124.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.124.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.124.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.125.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.125.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.125.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.125.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.125.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.125.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.126.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.126.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.126.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.126.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.126.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.126.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.127.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.127.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.127.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.127.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.127.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.127.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.13.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.13.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.13.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.13.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.13.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.13.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.14.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.14.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.14.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.14.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.14.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.14.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.15.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.15.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.15.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.15.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.15.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.15.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.16.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.16.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.16.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.16.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.16.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.16.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.17.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.17.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.17.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.17.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.17.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.17.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.18.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.18.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.18.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.18.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.18.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.18.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.19.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.19.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.19.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.19.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.19.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.19.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.2.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.2.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.2.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.2.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.2.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.2.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.20.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.20.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.20.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.20.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.20.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.20.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.21.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.21.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.21.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.21.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.21.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.21.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.22.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.22.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.22.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.22.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.22.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.22.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.23.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.23.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.23.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.23.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.23.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.23.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.24.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.24.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.24.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.24.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.24.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.24.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.25.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.25.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.25.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.25.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.25.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.25.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.26.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.26.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.26.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.26.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.26.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.26.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.27.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.27.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.27.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.27.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.27.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.27.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.28.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.28.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.28.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.28.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.28.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.28.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.29.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.29.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.29.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.29.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.29.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.29.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.3.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.3.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.3.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.3.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.3.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.3.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.30.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.30.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.30.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.30.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.30.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.30.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.31.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.31.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.31.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.31.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.31.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.31.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.32.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.32.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.32.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.32.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.32.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.32.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.33.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.33.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.33.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.33.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.33.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.33.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.34.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.34.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.34.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.34.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.34.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.34.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.35.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.35.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.35.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.35.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.35.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.35.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.36.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.36.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.36.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.36.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.36.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.36.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.37.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.37.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.37.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.37.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.37.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.37.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.38.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.38.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.38.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.38.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.38.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.38.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.39.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.39.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.39.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.39.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.39.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.39.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.4.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.4.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.4.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.4.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.4.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.4.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.40.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.40.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.40.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.40.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.40.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.40.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.41.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.41.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.41.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.41.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.41.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.41.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.42.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.42.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.42.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.42.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.42.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.42.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.43.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.43.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.43.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.43.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.43.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.43.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.44.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.44.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.44.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.44.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.44.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.44.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.45.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.45.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.45.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.45.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.45.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.45.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.46.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.46.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.46.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.46.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.46.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.46.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.47.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.47.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.47.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.47.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.47.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.47.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.48.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.48.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.48.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.48.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.48.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.48.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.49.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.49.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.49.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.49.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.49.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.49.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.5.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.5.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.5.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.5.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.5.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.5.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.50.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.50.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.50.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.50.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.50.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.50.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.51.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.51.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.51.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.51.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.51.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.51.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.52.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.52.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.52.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.52.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.52.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.52.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.53.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.53.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.53.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.53.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.53.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.53.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.54.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.54.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.54.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.54.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.54.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.54.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.55.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.55.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.55.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.55.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.55.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.55.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.56.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.56.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.56.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.56.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.56.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.56.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.57.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.57.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.57.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.57.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.57.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.57.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.58.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.58.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.58.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.58.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.58.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.58.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.59.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.59.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.59.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.59.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.59.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.59.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.6.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.6.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.6.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.6.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.6.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.6.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.60.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.60.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.60.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.60.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.60.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.60.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.61.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.61.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.61.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.61.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.61.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.61.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.62.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.62.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.62.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.62.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.62.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.62.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.63.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.63.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.63.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.63.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.63.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.63.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.64.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.64.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.64.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.64.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.64.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.64.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.65.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.65.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.65.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.65.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.65.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.65.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.66.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.66.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.66.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.66.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.66.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.66.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.67.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.67.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.67.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.67.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.67.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.67.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.68.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.68.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.68.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.68.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.68.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.68.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.69.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.69.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.69.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.69.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.69.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.69.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.7.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.7.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.7.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.7.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.7.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.7.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.70.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.70.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.70.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.70.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.70.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.70.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.71.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.71.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.71.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.71.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.71.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.71.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.72.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.72.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.72.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.72.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.72.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.72.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.73.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.73.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.73.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.73.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.73.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.73.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.74.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.74.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.74.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.74.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.74.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.74.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.75.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.75.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.75.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.75.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.75.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.75.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.76.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.76.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.76.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.76.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.76.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.76.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.77.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.77.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.77.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.77.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.77.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.77.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.78.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.78.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.78.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.78.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.78.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.78.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.79.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.79.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.79.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.79.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.79.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.79.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.8.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.8.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.8.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.8.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.8.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.8.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.80.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.80.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.80.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.80.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.80.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.80.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.81.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.81.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.81.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.81.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.81.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.81.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.82.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.82.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.82.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.82.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.82.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.82.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.83.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.83.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.83.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.83.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.83.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.83.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.84.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.84.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.84.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.84.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.84.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.84.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.85.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.85.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.85.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.85.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.85.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.85.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.86.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.86.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.86.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.86.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.86.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.86.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.87.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.87.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.87.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.87.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.87.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.87.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.88.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.88.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.88.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.88.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.88.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.88.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.89.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.89.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.89.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.89.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.89.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.89.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.9.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.9.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.9.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.9.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.9.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.9.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.90.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.90.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.90.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.90.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.90.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.90.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.91.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.91.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.91.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.91.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.91.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.91.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.92.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.92.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.92.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.92.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.92.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.92.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.93.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.93.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.93.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.93.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.93.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.93.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.94.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.94.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.94.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.94.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.94.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.94.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.95.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.95.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.95.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.95.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.95.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.95.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.96.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.96.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.96.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.96.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.96.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.96.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.97.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.97.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.97.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.97.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.97.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.97.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.98.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.98.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.98.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.98.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.98.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.98.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.99.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.99.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.99.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.99.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.99.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.experts.99.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.gate.e_score_correction_bias": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.gate.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.shared_experts.down_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.shared_experts.down_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.shared_experts.gate_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.shared_experts.gate_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.shared_experts.up_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.mlp.shared_experts.up_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.post_attention_layernorm.weight": "model-00008-of-00047.safetensors", + "model.layers.7.self_attn.k_proj.bias": "model-00008-of-00047.safetensors", + "model.layers.7.self_attn.k_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.self_attn.k_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.self_attn.o_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.self_attn.o_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.self_attn.q_proj.bias": "model-00008-of-00047.safetensors", + "model.layers.7.self_attn.q_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.self_attn.q_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.7.self_attn.v_proj.bias": "model-00008-of-00047.safetensors", + "model.layers.7.self_attn.v_proj.weight": "model-00008-of-00047.safetensors", + "model.layers.7.self_attn.v_proj.weight_scale": "model-00008-of-00047.safetensors", + "model.layers.8.input_layernorm.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.0.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.0.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.0.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.0.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.0.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.0.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.1.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.1.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.1.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.1.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.1.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.1.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.10.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.10.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.10.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.10.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.10.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.10.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.100.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.100.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.100.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.100.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.100.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.100.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.101.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.101.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.101.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.101.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.101.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.101.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.102.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.102.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.102.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.102.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.102.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.102.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.103.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.103.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.103.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.103.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.103.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.103.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.104.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.104.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.104.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.104.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.104.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.104.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.105.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.105.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.105.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.105.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.105.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.105.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.106.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.106.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.106.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.106.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.106.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.106.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.107.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.107.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.107.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.107.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.107.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.107.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.108.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.108.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.108.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.108.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.108.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.108.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.109.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.109.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.109.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.109.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.109.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.109.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.11.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.11.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.11.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.11.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.11.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.11.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.110.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.110.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.110.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.110.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.110.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.110.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.111.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.111.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.111.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.111.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.111.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.111.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.112.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.112.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.112.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.112.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.112.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.112.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.113.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.113.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.113.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.113.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.113.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.113.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.114.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.114.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.114.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.114.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.114.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.114.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.115.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.115.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.115.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.115.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.115.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.115.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.116.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.116.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.116.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.116.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.116.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.116.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.117.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.117.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.117.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.117.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.117.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.117.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.118.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.118.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.118.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.118.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.118.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.118.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.119.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.119.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.119.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.119.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.119.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.119.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.12.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.12.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.12.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.12.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.12.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.12.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.120.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.120.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.120.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.120.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.120.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.120.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.121.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.121.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.121.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.121.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.121.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.121.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.122.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.122.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.122.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.122.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.122.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.122.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.123.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.123.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.123.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.123.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.123.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.123.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.124.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.124.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.124.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.124.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.124.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.124.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.125.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.125.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.125.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.125.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.125.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.125.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.126.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.126.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.126.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.126.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.126.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.126.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.127.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.127.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.127.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.127.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.127.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.127.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.13.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.13.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.13.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.13.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.13.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.13.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.14.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.14.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.14.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.14.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.14.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.14.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.15.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.15.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.15.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.15.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.15.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.15.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.16.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.16.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.16.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.16.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.16.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.16.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.17.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.17.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.17.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.17.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.17.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.17.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.18.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.18.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.18.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.18.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.18.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.18.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.19.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.19.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.19.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.19.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.19.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.19.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.2.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.2.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.2.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.2.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.2.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.2.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.20.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.20.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.20.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.20.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.20.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.20.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.21.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.21.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.21.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.21.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.21.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.21.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.22.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.22.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.22.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.22.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.22.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.22.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.23.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.23.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.23.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.23.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.23.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.23.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.24.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.24.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.24.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.24.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.24.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.24.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.25.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.25.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.25.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.25.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.25.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.25.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.26.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.26.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.26.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.26.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.26.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.26.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.27.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.27.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.27.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.27.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.27.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.27.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.28.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.28.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.28.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.28.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.28.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.28.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.29.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.29.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.29.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.29.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.29.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.29.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.3.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.3.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.3.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.3.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.3.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.3.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.30.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.30.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.30.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.30.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.30.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.30.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.31.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.31.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.31.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.31.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.31.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.31.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.32.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.32.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.32.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.32.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.32.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.32.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.33.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.33.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.33.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.33.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.33.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.33.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.34.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.34.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.34.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.34.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.34.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.34.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.35.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.35.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.35.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.35.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.35.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.35.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.36.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.36.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.36.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.36.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.36.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.36.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.37.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.37.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.37.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.37.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.37.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.37.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.38.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.38.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.38.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.38.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.38.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.38.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.39.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.39.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.39.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.39.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.39.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.39.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.4.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.4.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.4.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.4.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.4.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.4.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.40.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.40.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.40.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.40.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.40.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.40.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.41.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.41.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.41.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.41.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.41.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.41.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.42.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.42.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.42.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.42.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.42.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.42.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.43.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.43.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.43.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.43.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.43.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.43.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.44.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.44.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.44.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.44.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.44.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.44.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.45.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.45.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.45.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.45.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.45.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.45.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.46.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.46.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.46.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.46.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.46.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.46.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.47.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.47.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.47.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.47.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.47.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.47.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.48.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.48.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.48.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.48.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.48.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.48.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.49.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.49.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.49.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.49.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.49.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.49.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.5.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.5.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.5.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.5.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.5.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.5.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.50.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.50.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.50.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.50.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.50.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.50.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.51.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.51.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.51.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.51.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.51.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.51.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.52.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.52.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.52.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.52.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.52.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.52.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.53.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.53.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.53.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.53.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.53.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.53.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.54.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.54.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.54.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.54.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.54.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.54.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.55.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.55.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.55.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.55.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.55.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.55.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.56.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.56.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.56.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.56.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.56.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.56.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.57.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.57.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.57.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.57.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.57.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.57.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.58.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.58.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.58.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.58.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.58.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.58.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.59.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.59.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.59.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.59.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.59.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.59.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.6.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.6.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.6.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.6.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.6.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.6.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.60.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.60.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.60.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.60.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.60.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.60.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.61.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.61.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.61.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.61.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.61.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.61.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.62.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.62.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.62.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.62.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.62.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.62.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.63.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.63.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.63.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.63.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.63.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.63.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.64.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.64.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.64.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.64.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.64.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.64.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.65.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.65.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.65.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.65.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.65.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.65.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.66.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.66.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.66.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.66.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.66.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.66.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.67.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.67.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.67.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.67.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.67.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.67.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.68.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.68.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.68.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.68.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.68.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.68.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.69.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.69.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.69.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.69.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.69.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.69.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.7.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.7.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.7.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.7.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.7.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.7.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.70.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.70.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.70.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.70.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.70.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.70.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.71.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.71.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.71.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.71.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.71.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.71.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.72.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.72.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.72.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.72.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.72.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.72.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.73.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.73.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.73.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.73.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.73.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.73.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.74.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.74.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.74.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.74.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.74.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.74.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.75.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.75.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.75.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.75.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.75.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.75.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.76.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.76.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.76.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.76.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.76.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.76.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.77.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.77.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.77.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.77.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.77.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.77.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.78.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.78.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.78.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.78.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.78.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.78.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.79.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.79.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.79.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.79.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.79.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.79.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.8.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.8.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.8.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.8.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.8.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.8.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.80.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.80.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.80.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.80.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.80.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.80.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.81.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.81.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.81.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.81.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.81.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.81.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.82.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.82.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.82.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.82.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.82.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.82.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.83.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.83.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.83.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.83.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.83.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.83.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.84.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.84.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.84.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.84.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.84.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.84.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.85.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.85.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.85.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.85.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.85.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.85.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.86.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.86.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.86.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.86.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.86.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.86.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.87.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.87.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.87.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.87.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.87.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.87.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.88.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.88.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.88.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.88.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.88.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.88.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.89.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.89.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.89.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.89.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.89.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.89.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.9.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.9.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.9.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.9.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.9.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.9.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.90.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.90.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.90.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.90.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.90.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.90.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.91.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.91.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.91.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.91.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.91.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.91.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.92.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.92.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.92.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.92.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.92.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.92.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.93.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.93.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.93.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.93.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.93.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.93.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.94.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.94.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.94.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.94.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.94.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.94.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.95.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.95.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.95.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.95.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.95.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.95.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.96.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.96.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.96.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.96.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.96.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.96.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.97.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.97.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.97.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.97.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.97.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.97.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.98.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.98.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.98.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.98.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.98.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.98.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.99.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.99.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.99.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.99.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.99.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.experts.99.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.gate.e_score_correction_bias": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.gate.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.shared_experts.down_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.shared_experts.down_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.shared_experts.gate_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.shared_experts.gate_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.shared_experts.up_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.mlp.shared_experts.up_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.post_attention_layernorm.weight": "model-00009-of-00047.safetensors", + "model.layers.8.self_attn.k_proj.bias": "model-00009-of-00047.safetensors", + "model.layers.8.self_attn.k_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.self_attn.k_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.self_attn.o_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.self_attn.o_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.self_attn.q_proj.bias": "model-00009-of-00047.safetensors", + "model.layers.8.self_attn.q_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.self_attn.q_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.8.self_attn.v_proj.bias": "model-00009-of-00047.safetensors", + "model.layers.8.self_attn.v_proj.weight": "model-00009-of-00047.safetensors", + "model.layers.8.self_attn.v_proj.weight_scale": "model-00009-of-00047.safetensors", + "model.layers.9.input_layernorm.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.0.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.0.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.0.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.0.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.0.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.0.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.1.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.1.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.1.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.1.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.1.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.1.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.10.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.10.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.10.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.10.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.10.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.10.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.100.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.100.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.100.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.100.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.100.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.100.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.101.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.101.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.101.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.101.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.101.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.101.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.102.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.102.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.102.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.102.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.102.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.102.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.103.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.103.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.103.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.103.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.103.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.103.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.104.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.104.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.104.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.104.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.104.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.104.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.105.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.105.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.105.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.105.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.105.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.105.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.106.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.106.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.106.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.106.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.106.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.106.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.107.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.107.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.107.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.107.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.107.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.107.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.108.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.108.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.108.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.108.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.108.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.108.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.109.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.109.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.109.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.109.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.109.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.109.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.11.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.11.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.11.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.11.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.11.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.11.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.110.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.110.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.110.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.110.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.110.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.110.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.111.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.111.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.111.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.111.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.111.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.111.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.112.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.112.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.112.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.112.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.112.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.112.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.113.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.113.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.113.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.113.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.113.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.113.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.114.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.114.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.114.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.114.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.114.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.114.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.115.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.115.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.115.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.115.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.115.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.115.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.116.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.116.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.116.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.116.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.116.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.116.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.117.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.117.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.117.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.117.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.117.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.117.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.118.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.118.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.118.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.118.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.118.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.118.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.119.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.119.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.119.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.119.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.119.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.119.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.12.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.12.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.12.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.12.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.12.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.12.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.120.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.120.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.120.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.120.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.120.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.120.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.121.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.121.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.121.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.121.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.121.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.121.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.122.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.122.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.122.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.122.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.122.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.122.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.123.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.123.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.123.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.123.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.123.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.123.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.124.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.124.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.124.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.124.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.124.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.124.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.125.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.125.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.125.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.125.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.125.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.125.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.126.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.126.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.126.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.126.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.126.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.126.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.127.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.127.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.127.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.127.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.127.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.127.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.13.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.13.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.13.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.13.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.13.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.13.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.14.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.14.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.14.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.14.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.14.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.14.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.15.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.15.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.15.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.15.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.15.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.15.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.16.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.16.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.16.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.16.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.16.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.16.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.17.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.17.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.17.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.17.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.17.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.17.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.18.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.18.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.18.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.18.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.18.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.18.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.19.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.19.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.19.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.19.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.19.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.19.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.2.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.2.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.2.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.2.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.2.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.2.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.20.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.20.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.20.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.20.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.20.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.20.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.21.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.21.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.21.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.21.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.21.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.21.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.22.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.22.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.22.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.22.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.22.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.22.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.23.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.23.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.23.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.23.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.23.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.23.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.24.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.24.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.24.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.24.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.24.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.24.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.25.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.25.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.25.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.25.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.25.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.25.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.26.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.26.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.26.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.26.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.26.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.26.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.27.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.27.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.27.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.27.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.27.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.27.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.28.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.28.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.28.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.28.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.28.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.28.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.29.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.29.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.29.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.29.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.29.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.29.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.3.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.3.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.3.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.3.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.3.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.3.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.30.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.30.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.30.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.30.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.30.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.30.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.31.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.31.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.31.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.31.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.31.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.31.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.32.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.32.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.32.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.32.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.32.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.32.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.33.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.33.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.33.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.33.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.33.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.33.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.34.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.34.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.34.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.34.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.34.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.34.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.35.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.35.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.35.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.35.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.35.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.35.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.36.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.36.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.36.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.36.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.36.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.36.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.37.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.37.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.37.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.37.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.37.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.37.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.38.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.38.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.38.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.38.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.38.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.38.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.39.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.39.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.39.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.39.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.39.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.39.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.4.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.4.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.4.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.4.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.4.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.4.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.40.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.40.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.40.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.40.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.40.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.40.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.41.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.41.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.41.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.41.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.41.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.41.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.42.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.42.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.42.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.42.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.42.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.42.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.43.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.43.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.43.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.43.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.43.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.43.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.44.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.44.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.44.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.44.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.44.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.44.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.45.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.45.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.45.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.45.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.45.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.45.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.46.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.46.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.46.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.46.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.46.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.46.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.47.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.47.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.47.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.47.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.47.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.47.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.48.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.48.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.48.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.48.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.48.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.48.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.49.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.49.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.49.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.49.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.49.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.49.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.5.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.5.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.5.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.5.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.5.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.5.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.50.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.50.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.50.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.50.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.50.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.50.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.51.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.51.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.51.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.51.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.51.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.51.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.52.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.52.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.52.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.52.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.52.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.52.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.53.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.53.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.53.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.53.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.53.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.53.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.54.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.54.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.54.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.54.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.54.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.54.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.55.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.55.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.55.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.55.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.55.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.55.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.56.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.56.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.56.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.56.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.56.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.56.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.57.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.57.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.57.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.57.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.57.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.57.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.58.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.58.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.58.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.58.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.58.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.58.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.59.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.59.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.59.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.59.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.59.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.59.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.6.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.6.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.6.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.6.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.6.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.6.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.60.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.60.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.60.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.60.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.60.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.60.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.61.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.61.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.61.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.61.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.61.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.61.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.62.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.62.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.62.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.62.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.62.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.62.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.63.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.63.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.63.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.63.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.63.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.63.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.64.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.64.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.64.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.64.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.64.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.64.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.65.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.65.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.65.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.65.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.65.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.65.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.66.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.66.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.66.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.66.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.66.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.66.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.67.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.67.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.67.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.67.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.67.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.67.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.68.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.68.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.68.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.68.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.68.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.68.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.69.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.69.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.69.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.69.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.69.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.69.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.7.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.7.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.7.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.7.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.7.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.7.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.70.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.70.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.70.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.70.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.70.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.70.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.71.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.71.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.71.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.71.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.71.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.71.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.72.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.72.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.72.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.72.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.72.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.72.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.73.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.73.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.73.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.73.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.73.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.73.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.74.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.74.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.74.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.74.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.74.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.74.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.75.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.75.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.75.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.75.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.75.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.75.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.76.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.76.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.76.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.76.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.76.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.76.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.77.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.77.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.77.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.77.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.77.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.77.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.78.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.78.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.78.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.78.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.78.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.78.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.79.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.79.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.79.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.79.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.79.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.79.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.8.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.8.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.8.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.8.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.8.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.8.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.80.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.80.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.80.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.80.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.80.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.80.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.81.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.81.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.81.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.81.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.81.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.81.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.82.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.82.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.82.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.82.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.82.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.82.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.83.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.83.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.83.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.83.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.83.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.83.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.84.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.84.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.84.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.84.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.84.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.84.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.85.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.85.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.85.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.85.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.85.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.85.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.86.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.86.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.86.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.86.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.86.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.86.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.87.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.87.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.87.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.87.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.87.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.87.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.88.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.88.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.88.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.88.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.88.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.88.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.89.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.89.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.89.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.89.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.89.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.89.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.9.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.9.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.9.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.9.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.9.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.9.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.90.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.90.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.90.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.90.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.90.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.90.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.91.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.91.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.91.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.91.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.91.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.91.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.92.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.92.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.92.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.92.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.92.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.92.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.93.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.93.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.93.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.93.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.93.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.93.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.94.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.94.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.94.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.94.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.94.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.94.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.95.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.95.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.95.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.95.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.95.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.95.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.96.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.96.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.96.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.96.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.96.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.96.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.97.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.97.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.97.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.97.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.97.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.97.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.98.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.98.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.98.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.98.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.98.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.98.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.99.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.99.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.99.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.99.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.99.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.experts.99.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.gate.e_score_correction_bias": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.gate.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.shared_experts.down_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.shared_experts.down_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.shared_experts.gate_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.shared_experts.gate_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.shared_experts.up_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.mlp.shared_experts.up_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.post_attention_layernorm.weight": "model-00010-of-00047.safetensors", + "model.layers.9.self_attn.k_proj.bias": "model-00010-of-00047.safetensors", + "model.layers.9.self_attn.k_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.self_attn.k_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.self_attn.o_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.self_attn.o_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.self_attn.q_proj.bias": "model-00010-of-00047.safetensors", + "model.layers.9.self_attn.q_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.self_attn.q_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.9.self_attn.v_proj.bias": "model-00010-of-00047.safetensors", + "model.layers.9.self_attn.v_proj.weight": "model-00010-of-00047.safetensors", + "model.layers.9.self_attn.v_proj.weight_scale": "model-00010-of-00047.safetensors", + "model.layers.10.input_layernorm.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.0.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.0.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.0.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.0.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.0.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.0.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.1.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.1.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.1.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.1.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.1.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.1.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.10.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.10.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.10.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.10.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.10.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.10.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.100.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.100.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.100.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.100.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.100.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.100.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.101.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.101.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.101.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.101.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.101.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.101.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.102.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.102.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.102.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.102.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.102.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.102.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.103.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.103.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.103.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.103.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.103.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.103.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.104.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.104.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.104.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.104.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.104.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.104.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.105.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.105.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.105.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.105.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.105.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.105.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.106.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.106.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.106.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.106.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.106.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.106.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.107.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.107.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.107.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.107.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.107.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.107.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.108.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.108.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.108.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.108.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.108.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.108.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.109.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.109.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.109.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.109.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.109.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.109.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.11.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.11.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.11.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.11.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.11.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.11.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.110.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.110.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.110.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.110.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.110.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.110.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.111.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.111.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.111.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.111.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.111.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.111.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.112.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.112.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.112.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.112.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.112.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.112.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.113.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.113.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.113.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.113.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.113.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.113.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.114.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.114.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.114.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.114.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.114.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.114.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.115.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.115.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.115.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.115.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.115.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.115.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.116.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.116.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.116.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.116.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.116.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.116.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.117.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.117.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.117.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.117.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.117.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.117.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.118.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.118.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.118.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.118.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.118.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.118.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.119.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.119.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.119.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.119.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.119.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.119.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.12.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.12.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.12.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.12.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.12.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.12.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.120.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.120.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.120.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.120.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.120.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.120.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.121.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.121.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.121.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.121.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.121.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.121.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.122.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.122.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.122.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.122.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.122.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.122.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.123.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.123.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.123.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.123.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.123.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.123.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.124.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.124.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.124.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.124.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.124.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.124.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.125.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.125.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.125.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.125.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.125.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.125.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.126.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.126.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.126.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.126.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.126.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.126.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.127.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.127.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.127.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.127.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.127.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.127.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.13.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.13.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.13.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.13.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.13.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.13.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.14.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.14.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.14.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.14.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.14.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.14.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.15.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.15.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.15.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.15.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.15.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.15.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.16.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.16.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.16.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.16.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.16.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.16.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.17.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.17.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.17.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.17.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.17.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.17.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.18.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.18.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.18.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.18.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.18.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.18.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.19.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.19.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.19.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.19.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.19.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.19.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.2.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.2.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.2.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.2.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.2.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.2.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.20.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.20.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.20.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.20.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.20.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.20.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.21.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.21.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.21.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.21.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.21.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.21.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.22.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.22.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.22.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.22.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.22.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.22.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.23.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.23.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.23.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.23.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.23.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.23.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.24.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.24.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.24.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.24.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.24.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.24.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.25.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.25.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.25.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.25.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.25.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.25.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.26.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.26.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.26.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.26.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.26.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.26.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.27.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.27.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.27.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.27.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.27.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.27.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.28.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.28.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.28.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.28.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.28.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.28.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.29.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.29.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.29.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.29.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.29.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.29.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.3.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.3.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.3.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.3.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.3.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.3.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.30.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.30.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.30.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.30.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.30.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.30.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.31.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.31.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.31.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.31.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.31.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.31.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.32.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.32.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.32.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.32.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.32.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.32.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.33.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.33.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.33.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.33.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.33.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.33.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.34.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.34.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.34.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.34.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.34.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.34.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.35.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.35.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.35.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.35.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.35.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.35.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.36.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.36.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.36.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.36.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.36.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.36.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.37.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.37.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.37.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.37.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.37.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.37.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.38.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.38.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.38.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.38.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.38.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.38.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.39.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.39.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.39.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.39.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.39.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.39.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.4.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.4.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.4.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.4.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.4.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.4.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.40.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.40.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.40.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.40.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.40.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.40.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.41.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.41.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.41.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.41.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.41.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.41.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.42.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.42.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.42.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.42.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.42.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.42.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.43.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.43.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.43.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.43.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.43.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.43.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.44.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.44.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.44.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.44.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.44.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.44.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.45.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.45.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.45.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.45.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.45.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.45.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.46.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.46.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.46.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.46.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.46.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.46.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.47.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.47.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.47.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.47.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.47.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.47.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.48.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.48.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.48.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.48.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.48.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.48.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.49.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.49.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.49.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.49.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.49.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.49.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.5.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.5.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.5.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.5.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.5.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.5.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.50.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.50.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.50.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.50.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.50.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.50.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.51.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.51.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.51.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.51.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.51.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.51.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.52.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.52.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.52.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.52.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.52.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.52.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.53.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.53.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.53.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.53.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.53.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.53.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.54.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.54.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.54.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.54.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.54.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.54.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.55.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.55.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.55.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.55.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.55.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.55.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.56.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.56.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.56.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.56.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.56.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.56.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.57.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.57.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.57.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.57.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.57.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.57.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.58.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.58.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.58.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.58.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.58.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.58.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.59.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.59.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.59.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.59.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.59.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.59.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.6.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.6.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.6.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.6.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.6.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.6.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.60.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.60.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.60.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.60.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.60.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.60.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.61.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.61.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.61.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.61.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.61.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.61.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.62.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.62.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.62.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.62.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.62.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.62.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.63.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.63.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.63.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.63.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.63.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.63.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.64.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.64.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.64.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.64.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.64.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.64.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.65.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.65.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.65.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.65.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.65.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.65.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.66.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.66.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.66.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.66.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.66.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.66.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.67.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.67.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.67.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.67.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.67.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.67.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.68.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.68.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.68.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.68.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.68.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.68.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.69.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.69.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.69.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.69.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.69.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.69.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.7.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.7.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.7.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.7.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.7.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.7.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.70.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.70.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.70.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.70.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.70.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.70.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.71.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.71.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.71.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.71.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.71.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.71.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.72.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.72.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.72.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.72.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.72.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.72.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.73.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.73.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.73.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.73.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.73.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.73.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.74.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.74.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.74.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.74.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.74.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.74.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.75.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.75.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.75.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.75.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.75.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.75.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.76.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.76.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.76.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.76.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.76.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.76.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.77.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.77.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.77.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.77.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.77.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.77.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.78.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.78.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.78.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.78.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.78.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.78.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.79.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.79.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.79.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.79.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.79.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.79.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.8.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.8.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.8.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.8.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.8.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.8.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.80.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.80.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.80.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.80.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.80.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.80.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.81.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.81.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.81.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.81.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.81.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.81.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.82.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.82.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.82.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.82.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.82.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.82.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.83.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.83.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.83.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.83.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.83.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.83.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.84.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.84.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.84.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.84.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.84.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.84.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.85.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.85.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.85.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.85.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.85.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.85.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.86.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.86.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.86.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.86.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.86.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.86.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.87.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.87.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.87.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.87.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.87.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.87.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.88.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.88.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.88.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.88.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.88.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.88.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.89.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.89.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.89.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.89.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.89.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.89.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.9.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.9.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.9.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.9.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.9.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.9.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.90.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.90.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.90.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.90.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.90.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.90.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.91.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.91.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.91.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.91.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.91.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.91.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.92.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.92.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.92.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.92.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.92.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.92.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.93.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.93.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.93.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.93.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.93.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.93.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.94.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.94.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.94.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.94.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.94.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.94.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.95.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.95.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.95.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.95.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.95.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.95.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.96.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.96.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.96.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.96.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.96.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.96.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.97.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.97.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.97.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.97.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.97.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.97.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.98.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.98.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.98.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.98.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.98.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.98.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.99.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.99.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.99.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.99.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.99.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.experts.99.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.gate.e_score_correction_bias": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.gate.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.shared_experts.down_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.shared_experts.down_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.shared_experts.gate_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.shared_experts.gate_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.shared_experts.up_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.mlp.shared_experts.up_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.post_attention_layernorm.weight": "model-00011-of-00047.safetensors", + "model.layers.10.self_attn.k_proj.bias": "model-00011-of-00047.safetensors", + "model.layers.10.self_attn.k_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.self_attn.k_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.self_attn.o_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.self_attn.o_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.self_attn.q_proj.bias": "model-00011-of-00047.safetensors", + "model.layers.10.self_attn.q_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.self_attn.q_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.10.self_attn.v_proj.bias": "model-00011-of-00047.safetensors", + "model.layers.10.self_attn.v_proj.weight": "model-00011-of-00047.safetensors", + "model.layers.10.self_attn.v_proj.weight_scale": "model-00011-of-00047.safetensors", + "model.layers.11.input_layernorm.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.0.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.0.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.0.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.0.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.0.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.0.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.1.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.1.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.1.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.1.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.1.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.1.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.10.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.10.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.10.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.10.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.10.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.10.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.100.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.100.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.100.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.100.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.100.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.100.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.101.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.101.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.101.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.101.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.101.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.101.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.102.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.102.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.102.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.102.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.102.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.102.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.103.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.103.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.103.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.103.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.103.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.103.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.104.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.104.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.104.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.104.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.104.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.104.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.105.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.105.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.105.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.105.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.105.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.105.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.106.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.106.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.106.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.106.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.106.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.106.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.107.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.107.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.107.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.107.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.107.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.107.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.108.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.108.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.108.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.108.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.108.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.108.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.109.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.109.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.109.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.109.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.109.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.109.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.11.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.11.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.11.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.11.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.11.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.11.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.110.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.110.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.110.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.110.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.110.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.110.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.111.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.111.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.111.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.111.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.111.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.111.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.112.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.112.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.112.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.112.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.112.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.112.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.113.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.113.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.113.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.113.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.113.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.113.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.114.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.114.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.114.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.114.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.114.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.114.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.115.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.115.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.115.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.115.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.115.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.115.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.116.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.116.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.116.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.116.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.116.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.116.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.117.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.117.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.117.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.117.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.117.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.117.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.118.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.118.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.118.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.118.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.118.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.118.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.119.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.119.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.119.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.119.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.119.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.119.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.12.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.12.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.12.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.12.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.12.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.12.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.120.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.120.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.120.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.120.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.120.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.120.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.121.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.121.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.121.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.121.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.121.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.121.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.122.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.122.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.122.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.122.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.122.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.122.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.123.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.123.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.123.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.123.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.123.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.123.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.124.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.124.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.124.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.124.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.124.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.124.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.125.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.125.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.125.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.125.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.125.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.125.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.126.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.126.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.126.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.126.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.126.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.126.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.127.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.127.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.127.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.127.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.127.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.127.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.13.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.13.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.13.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.13.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.13.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.13.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.14.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.14.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.14.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.14.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.14.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.14.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.15.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.15.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.15.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.15.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.15.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.15.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.16.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.16.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.16.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.16.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.16.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.16.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.17.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.17.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.17.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.17.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.17.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.17.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.18.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.18.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.18.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.18.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.18.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.18.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.19.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.19.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.19.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.19.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.19.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.19.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.2.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.2.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.2.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.2.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.2.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.2.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.20.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.20.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.20.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.20.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.20.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.20.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.21.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.21.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.21.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.21.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.21.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.21.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.22.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.22.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.22.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.22.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.22.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.22.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.23.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.23.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.23.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.23.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.23.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.23.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.24.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.24.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.24.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.24.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.24.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.24.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.25.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.25.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.25.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.25.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.25.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.25.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.26.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.26.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.26.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.26.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.26.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.26.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.27.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.27.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.27.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.27.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.27.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.27.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.28.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.28.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.28.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.28.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.28.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.28.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.29.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.29.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.29.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.29.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.29.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.29.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.3.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.3.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.3.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.3.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.3.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.3.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.30.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.30.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.30.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.30.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.30.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.30.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.31.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.31.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.31.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.31.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.31.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.31.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.32.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.32.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.32.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.32.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.32.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.32.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.33.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.33.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.33.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.33.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.33.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.33.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.34.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.34.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.34.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.34.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.34.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.34.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.35.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.35.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.35.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.35.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.35.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.35.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.36.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.36.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.36.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.36.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.36.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.36.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.37.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.37.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.37.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.37.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.37.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.37.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.38.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.38.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.38.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.38.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.38.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.38.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.39.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.39.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.39.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.39.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.39.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.39.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.4.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.4.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.4.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.4.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.4.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.4.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.40.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.40.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.40.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.40.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.40.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.40.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.41.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.41.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.41.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.41.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.41.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.41.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.42.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.42.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.42.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.42.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.42.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.42.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.43.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.43.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.43.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.43.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.43.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.43.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.44.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.44.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.44.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.44.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.44.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.44.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.45.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.45.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.45.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.45.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.45.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.45.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.46.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.46.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.46.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.46.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.46.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.46.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.47.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.47.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.47.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.47.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.47.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.47.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.48.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.48.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.48.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.48.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.48.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.48.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.49.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.49.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.49.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.49.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.49.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.49.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.5.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.5.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.5.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.5.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.5.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.5.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.50.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.50.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.50.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.50.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.50.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.50.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.51.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.51.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.51.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.51.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.51.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.51.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.52.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.52.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.52.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.52.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.52.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.52.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.53.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.53.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.53.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.53.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.53.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.53.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.54.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.54.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.54.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.54.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.54.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.54.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.55.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.55.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.55.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.55.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.55.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.55.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.56.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.56.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.56.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.56.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.56.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.56.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.57.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.57.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.57.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.57.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.57.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.57.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.58.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.58.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.58.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.58.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.58.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.58.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.59.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.59.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.59.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.59.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.59.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.59.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.6.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.6.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.6.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.6.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.6.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.6.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.60.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.60.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.60.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.60.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.60.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.60.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.61.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.61.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.61.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.61.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.61.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.61.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.62.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.62.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.62.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.62.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.62.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.62.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.63.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.63.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.63.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.63.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.63.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.63.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.64.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.64.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.64.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.64.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.64.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.64.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.65.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.65.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.65.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.65.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.65.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.65.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.66.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.66.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.66.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.66.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.66.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.66.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.67.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.67.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.67.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.67.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.67.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.67.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.68.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.68.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.68.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.68.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.68.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.68.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.69.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.69.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.69.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.69.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.69.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.69.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.7.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.7.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.7.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.7.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.7.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.7.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.70.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.70.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.70.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.70.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.70.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.70.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.71.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.71.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.71.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.71.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.71.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.71.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.72.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.72.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.72.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.72.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.72.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.72.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.73.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.73.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.73.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.73.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.73.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.73.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.74.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.74.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.74.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.74.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.74.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.74.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.75.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.75.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.75.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.75.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.75.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.75.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.76.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.76.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.76.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.76.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.76.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.76.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.77.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.77.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.77.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.77.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.77.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.77.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.78.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.78.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.78.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.78.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.78.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.78.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.79.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.79.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.79.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.79.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.79.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.79.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.8.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.8.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.8.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.8.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.8.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.8.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.80.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.80.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.80.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.80.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.80.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.80.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.81.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.81.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.81.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.81.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.81.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.81.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.82.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.82.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.82.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.82.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.82.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.82.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.83.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.83.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.83.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.83.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.83.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.83.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.84.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.84.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.84.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.84.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.84.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.84.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.85.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.85.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.85.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.85.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.85.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.85.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.86.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.86.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.86.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.86.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.86.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.86.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.87.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.87.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.87.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.87.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.87.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.87.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.88.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.88.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.88.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.88.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.88.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.88.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.89.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.89.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.89.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.89.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.89.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.89.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.9.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.9.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.9.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.9.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.9.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.9.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.90.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.90.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.90.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.90.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.90.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.90.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.91.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.91.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.91.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.91.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.91.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.91.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.92.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.92.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.92.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.92.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.92.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.92.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.93.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.93.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.93.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.93.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.93.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.93.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.94.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.94.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.94.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.94.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.94.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.94.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.95.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.95.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.95.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.95.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.95.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.95.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.96.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.96.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.96.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.96.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.96.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.96.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.97.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.97.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.97.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.97.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.97.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.97.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.98.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.98.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.98.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.98.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.98.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.98.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.99.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.99.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.99.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.99.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.99.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.experts.99.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.gate.e_score_correction_bias": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.gate.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.shared_experts.down_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.shared_experts.down_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.shared_experts.gate_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.shared_experts.gate_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.shared_experts.up_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.mlp.shared_experts.up_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.post_attention_layernorm.weight": "model-00012-of-00047.safetensors", + "model.layers.11.self_attn.k_proj.bias": "model-00012-of-00047.safetensors", + "model.layers.11.self_attn.k_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.self_attn.k_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.self_attn.o_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.self_attn.o_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.self_attn.q_proj.bias": "model-00012-of-00047.safetensors", + "model.layers.11.self_attn.q_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.self_attn.q_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.11.self_attn.v_proj.bias": "model-00012-of-00047.safetensors", + "model.layers.11.self_attn.v_proj.weight": "model-00012-of-00047.safetensors", + "model.layers.11.self_attn.v_proj.weight_scale": "model-00012-of-00047.safetensors", + "model.layers.12.input_layernorm.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.0.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.0.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.0.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.0.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.0.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.0.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.1.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.1.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.1.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.1.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.1.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.1.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.10.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.10.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.10.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.10.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.10.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.10.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.100.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.100.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.100.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.100.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.100.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.100.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.101.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.101.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.101.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.101.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.101.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.101.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.102.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.102.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.102.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.102.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.102.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.102.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.103.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.103.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.103.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.103.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.103.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.103.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.104.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.104.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.104.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.104.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.104.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.104.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.105.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.105.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.105.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.105.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.105.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.105.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.106.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.106.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.106.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.106.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.106.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.106.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.107.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.107.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.107.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.107.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.107.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.107.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.108.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.108.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.108.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.108.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.108.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.108.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.109.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.109.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.109.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.109.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.109.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.109.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.11.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.11.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.11.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.11.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.11.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.11.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.110.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.110.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.110.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.110.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.110.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.110.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.111.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.111.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.111.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.111.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.111.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.111.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.112.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.112.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.112.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.112.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.112.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.112.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.113.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.113.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.113.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.113.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.113.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.113.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.114.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.114.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.114.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.114.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.114.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.114.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.115.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.115.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.115.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.115.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.115.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.115.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.116.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.116.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.116.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.116.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.116.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.116.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.117.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.117.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.117.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.117.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.117.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.117.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.118.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.118.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.118.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.118.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.118.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.118.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.119.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.119.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.119.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.119.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.119.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.119.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.12.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.12.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.12.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.12.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.12.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.12.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.120.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.120.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.120.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.120.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.120.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.120.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.121.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.121.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.121.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.121.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.121.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.121.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.122.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.122.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.122.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.122.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.122.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.122.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.123.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.123.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.123.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.123.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.123.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.123.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.124.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.124.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.124.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.124.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.124.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.124.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.125.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.125.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.125.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.125.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.125.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.125.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.126.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.126.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.126.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.126.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.126.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.126.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.127.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.127.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.127.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.127.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.127.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.127.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.13.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.13.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.13.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.13.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.13.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.13.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.14.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.14.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.14.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.14.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.14.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.14.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.15.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.15.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.15.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.15.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.15.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.15.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.16.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.16.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.16.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.16.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.16.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.16.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.17.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.17.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.17.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.17.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.17.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.17.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.18.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.18.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.18.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.18.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.18.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.18.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.19.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.19.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.19.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.19.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.19.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.19.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.2.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.2.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.2.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.2.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.2.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.2.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.20.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.20.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.20.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.20.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.20.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.20.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.21.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.21.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.21.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.21.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.21.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.21.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.22.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.22.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.22.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.22.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.22.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.22.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.23.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.23.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.23.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.23.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.23.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.23.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.24.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.24.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.24.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.24.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.24.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.24.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.25.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.25.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.25.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.25.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.25.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.25.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.26.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.26.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.26.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.26.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.26.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.26.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.27.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.27.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.27.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.27.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.27.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.27.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.28.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.28.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.28.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.28.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.28.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.28.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.29.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.29.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.29.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.29.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.29.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.29.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.3.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.3.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.3.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.3.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.3.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.3.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.30.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.30.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.30.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.30.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.30.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.30.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.31.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.31.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.31.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.31.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.31.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.31.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.32.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.32.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.32.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.32.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.32.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.32.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.33.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.33.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.33.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.33.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.33.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.33.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.34.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.34.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.34.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.34.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.34.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.34.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.35.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.35.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.35.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.35.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.35.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.35.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.36.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.36.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.36.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.36.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.36.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.36.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.37.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.37.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.37.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.37.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.37.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.37.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.38.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.38.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.38.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.38.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.38.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.38.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.39.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.39.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.39.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.39.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.39.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.39.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.4.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.4.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.4.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.4.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.4.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.4.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.40.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.40.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.40.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.40.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.40.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.40.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.41.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.41.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.41.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.41.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.41.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.41.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.42.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.42.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.42.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.42.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.42.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.42.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.43.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.43.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.43.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.43.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.43.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.43.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.44.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.44.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.44.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.44.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.44.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.44.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.45.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.45.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.45.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.45.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.45.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.45.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.46.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.46.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.46.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.46.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.46.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.46.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.47.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.47.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.47.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.47.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.47.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.47.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.48.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.48.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.48.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.48.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.48.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.48.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.49.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.49.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.49.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.49.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.49.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.49.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.5.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.5.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.5.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.5.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.5.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.5.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.50.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.50.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.50.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.50.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.50.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.50.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.51.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.51.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.51.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.51.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.51.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.51.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.52.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.52.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.52.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.52.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.52.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.52.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.53.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.53.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.53.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.53.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.53.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.53.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.54.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.54.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.54.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.54.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.54.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.54.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.55.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.55.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.55.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.55.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.55.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.55.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.56.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.56.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.56.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.56.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.56.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.56.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.57.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.57.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.57.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.57.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.57.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.57.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.58.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.58.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.58.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.58.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.58.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.58.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.59.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.59.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.59.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.59.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.59.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.59.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.6.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.6.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.6.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.6.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.6.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.6.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.60.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.60.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.60.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.60.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.60.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.60.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.61.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.61.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.61.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.61.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.61.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.61.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.62.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.62.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.62.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.62.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.62.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.62.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.63.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.63.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.63.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.63.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.63.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.63.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.64.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.64.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.64.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.64.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.64.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.64.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.65.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.65.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.65.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.65.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.65.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.65.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.66.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.66.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.66.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.66.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.66.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.66.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.67.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.67.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.67.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.67.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.67.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.67.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.68.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.68.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.68.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.68.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.68.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.68.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.69.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.69.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.69.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.69.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.69.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.69.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.7.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.7.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.7.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.7.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.7.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.7.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.70.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.70.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.70.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.70.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.70.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.70.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.71.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.71.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.71.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.71.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.71.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.71.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.72.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.72.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.72.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.72.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.72.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.72.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.73.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.73.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.73.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.73.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.73.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.73.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.74.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.74.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.74.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.74.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.74.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.74.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.75.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.75.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.75.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.75.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.75.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.75.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.76.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.76.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.76.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.76.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.76.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.76.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.77.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.77.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.77.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.77.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.77.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.77.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.78.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.78.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.78.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.78.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.78.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.78.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.79.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.79.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.79.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.79.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.79.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.79.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.8.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.8.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.8.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.8.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.8.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.8.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.80.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.80.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.80.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.80.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.80.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.80.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.81.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.81.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.81.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.81.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.81.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.81.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.82.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.82.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.82.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.82.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.82.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.82.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.83.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.83.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.83.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.83.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.83.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.83.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.84.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.84.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.84.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.84.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.84.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.84.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.85.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.85.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.85.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.85.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.85.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.85.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.86.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.86.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.86.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.86.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.86.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.86.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.87.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.87.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.87.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.87.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.87.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.87.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.88.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.88.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.88.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.88.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.88.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.88.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.89.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.89.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.89.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.89.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.89.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.89.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.9.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.9.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.9.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.9.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.9.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.9.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.90.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.90.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.90.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.90.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.90.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.90.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.91.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.91.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.91.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.91.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.91.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.91.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.92.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.92.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.92.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.92.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.92.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.92.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.93.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.93.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.93.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.93.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.93.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.93.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.94.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.94.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.94.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.94.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.94.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.94.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.95.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.95.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.95.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.95.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.95.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.95.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.96.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.96.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.96.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.96.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.96.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.96.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.97.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.97.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.97.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.97.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.97.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.97.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.98.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.98.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.98.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.98.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.98.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.98.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.99.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.99.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.99.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.99.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.99.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.experts.99.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.gate.e_score_correction_bias": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.gate.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.shared_experts.down_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.shared_experts.down_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.shared_experts.gate_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.shared_experts.gate_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.shared_experts.up_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.mlp.shared_experts.up_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.post_attention_layernorm.weight": "model-00013-of-00047.safetensors", + "model.layers.12.self_attn.k_proj.bias": "model-00013-of-00047.safetensors", + "model.layers.12.self_attn.k_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.self_attn.k_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.self_attn.o_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.self_attn.o_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.self_attn.q_proj.bias": "model-00013-of-00047.safetensors", + "model.layers.12.self_attn.q_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.self_attn.q_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.12.self_attn.v_proj.bias": "model-00013-of-00047.safetensors", + "model.layers.12.self_attn.v_proj.weight": "model-00013-of-00047.safetensors", + "model.layers.12.self_attn.v_proj.weight_scale": "model-00013-of-00047.safetensors", + "model.layers.13.input_layernorm.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.0.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.0.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.0.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.0.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.0.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.0.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.1.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.1.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.1.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.1.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.1.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.1.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.10.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.10.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.10.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.10.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.10.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.10.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.100.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.100.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.100.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.100.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.100.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.100.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.101.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.101.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.101.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.101.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.101.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.101.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.102.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.102.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.102.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.102.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.102.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.102.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.103.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.103.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.103.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.103.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.103.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.103.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.104.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.104.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.104.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.104.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.104.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.104.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.105.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.105.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.105.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.105.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.105.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.105.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.106.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.106.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.106.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.106.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.106.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.106.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.107.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.107.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.107.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.107.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.107.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.107.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.108.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.108.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.108.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.108.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.108.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.108.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.109.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.109.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.109.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.109.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.109.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.109.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.11.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.11.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.11.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.11.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.11.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.11.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.110.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.110.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.110.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.110.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.110.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.110.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.111.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.111.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.111.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.111.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.111.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.111.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.112.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.112.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.112.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.112.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.112.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.112.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.113.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.113.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.113.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.113.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.113.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.113.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.114.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.114.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.114.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.114.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.114.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.114.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.115.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.115.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.115.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.115.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.115.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.115.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.116.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.116.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.116.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.116.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.116.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.116.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.117.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.117.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.117.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.117.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.117.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.117.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.118.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.118.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.118.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.118.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.118.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.118.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.119.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.119.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.119.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.119.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.119.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.119.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.12.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.12.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.12.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.12.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.12.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.12.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.120.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.120.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.120.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.120.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.120.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.120.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.121.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.121.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.121.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.121.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.121.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.121.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.122.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.122.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.122.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.122.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.122.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.122.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.123.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.123.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.123.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.123.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.123.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.123.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.124.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.124.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.124.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.124.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.124.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.124.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.125.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.125.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.125.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.125.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.125.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.125.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.126.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.126.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.126.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.126.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.126.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.126.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.127.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.127.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.127.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.127.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.127.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.127.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.13.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.13.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.13.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.13.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.13.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.13.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.14.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.14.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.14.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.14.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.14.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.14.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.15.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.15.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.15.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.15.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.15.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.15.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.16.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.16.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.16.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.16.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.16.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.16.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.17.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.17.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.17.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.17.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.17.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.17.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.18.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.18.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.18.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.18.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.18.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.18.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.19.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.19.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.19.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.19.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.19.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.19.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.2.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.2.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.2.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.2.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.2.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.2.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.20.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.20.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.20.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.20.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.20.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.20.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.21.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.21.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.21.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.21.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.21.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.21.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.22.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.22.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.22.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.22.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.22.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.22.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.23.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.23.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.23.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.23.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.23.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.23.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.24.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.24.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.24.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.24.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.24.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.24.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.25.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.25.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.25.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.25.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.25.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.25.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.26.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.26.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.26.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.26.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.26.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.26.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.27.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.27.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.27.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.27.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.27.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.27.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.28.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.28.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.28.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.28.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.28.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.28.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.29.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.29.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.29.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.29.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.29.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.29.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.3.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.3.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.3.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.3.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.3.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.3.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.30.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.30.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.30.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.30.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.30.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.30.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.31.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.31.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.31.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.31.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.31.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.31.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.32.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.32.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.32.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.32.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.32.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.32.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.33.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.33.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.33.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.33.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.33.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.33.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.34.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.34.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.34.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.34.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.34.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.34.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.35.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.35.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.35.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.35.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.35.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.35.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.36.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.36.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.36.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.36.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.36.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.36.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.37.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.37.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.37.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.37.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.37.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.37.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.38.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.38.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.38.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.38.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.38.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.38.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.39.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.39.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.39.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.39.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.39.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.39.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.4.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.4.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.4.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.4.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.4.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.4.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.40.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.40.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.40.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.40.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.40.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.40.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.41.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.41.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.41.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.41.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.41.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.41.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.42.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.42.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.42.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.42.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.42.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.42.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.43.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.43.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.43.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.43.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.43.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.43.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.44.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.44.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.44.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.44.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.44.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.44.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.45.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.45.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.45.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.45.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.45.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.45.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.46.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.46.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.46.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.46.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.46.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.46.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.47.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.47.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.47.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.47.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.47.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.47.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.48.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.48.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.48.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.48.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.48.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.48.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.49.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.49.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.49.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.49.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.49.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.49.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.5.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.5.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.5.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.5.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.5.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.5.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.50.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.50.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.50.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.50.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.50.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.50.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.51.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.51.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.51.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.51.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.51.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.51.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.52.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.52.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.52.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.52.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.52.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.52.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.53.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.53.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.53.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.53.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.53.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.53.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.54.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.54.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.54.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.54.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.54.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.54.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.55.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.55.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.55.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.55.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.55.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.55.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.56.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.56.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.56.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.56.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.56.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.56.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.57.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.57.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.57.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.57.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.57.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.57.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.58.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.58.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.58.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.58.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.58.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.58.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.59.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.59.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.59.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.59.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.59.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.59.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.6.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.6.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.6.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.6.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.6.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.6.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.60.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.60.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.60.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.60.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.60.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.60.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.61.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.61.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.61.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.61.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.61.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.61.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.62.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.62.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.62.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.62.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.62.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.62.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.63.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.63.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.63.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.63.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.63.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.63.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.64.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.64.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.64.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.64.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.64.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.64.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.65.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.65.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.65.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.65.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.65.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.65.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.66.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.66.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.66.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.66.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.66.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.66.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.67.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.67.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.67.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.67.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.67.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.67.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.68.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.68.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.68.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.68.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.68.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.68.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.69.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.69.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.69.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.69.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.69.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.69.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.7.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.7.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.7.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.7.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.7.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.7.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.70.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.70.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.70.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.70.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.70.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.70.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.71.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.71.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.71.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.71.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.71.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.71.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.72.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.72.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.72.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.72.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.72.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.72.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.73.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.73.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.73.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.73.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.73.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.73.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.74.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.74.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.74.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.74.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.74.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.74.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.75.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.75.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.75.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.75.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.75.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.75.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.76.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.76.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.76.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.76.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.76.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.76.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.77.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.77.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.77.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.77.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.77.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.77.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.78.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.78.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.78.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.78.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.78.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.78.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.79.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.79.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.79.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.79.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.79.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.79.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.8.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.8.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.8.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.8.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.8.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.8.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.80.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.80.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.80.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.80.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.80.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.80.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.81.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.81.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.81.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.81.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.81.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.81.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.82.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.82.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.82.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.82.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.82.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.82.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.83.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.83.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.83.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.83.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.83.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.83.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.84.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.84.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.84.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.84.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.84.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.84.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.85.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.85.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.85.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.85.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.85.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.85.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.86.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.86.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.86.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.86.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.86.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.86.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.87.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.87.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.87.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.87.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.87.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.87.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.88.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.88.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.88.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.88.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.88.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.88.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.89.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.89.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.89.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.89.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.89.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.89.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.9.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.9.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.9.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.9.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.9.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.9.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.90.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.90.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.90.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.90.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.90.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.90.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.91.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.91.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.91.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.91.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.91.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.91.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.92.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.92.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.92.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.92.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.92.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.92.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.93.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.93.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.93.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.93.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.93.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.93.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.94.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.94.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.94.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.94.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.94.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.94.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.95.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.95.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.95.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.95.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.95.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.95.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.96.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.96.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.96.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.96.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.96.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.96.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.97.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.97.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.97.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.97.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.97.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.97.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.98.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.98.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.98.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.98.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.98.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.98.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.99.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.99.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.99.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.99.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.99.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.experts.99.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.gate.e_score_correction_bias": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.gate.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.shared_experts.down_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.shared_experts.down_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.shared_experts.gate_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.shared_experts.gate_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.shared_experts.up_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.mlp.shared_experts.up_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.post_attention_layernorm.weight": "model-00014-of-00047.safetensors", + "model.layers.13.self_attn.k_proj.bias": "model-00014-of-00047.safetensors", + "model.layers.13.self_attn.k_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.self_attn.k_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.self_attn.o_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.self_attn.o_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.self_attn.q_proj.bias": "model-00014-of-00047.safetensors", + "model.layers.13.self_attn.q_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.self_attn.q_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.13.self_attn.v_proj.bias": "model-00014-of-00047.safetensors", + "model.layers.13.self_attn.v_proj.weight": "model-00014-of-00047.safetensors", + "model.layers.13.self_attn.v_proj.weight_scale": "model-00014-of-00047.safetensors", + "model.layers.14.input_layernorm.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.0.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.0.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.0.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.0.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.0.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.0.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.1.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.1.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.1.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.1.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.1.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.1.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.10.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.10.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.10.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.10.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.10.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.10.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.100.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.100.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.100.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.100.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.100.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.100.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.101.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.101.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.101.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.101.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.101.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.101.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.102.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.102.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.102.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.102.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.102.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.102.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.103.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.103.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.103.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.103.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.103.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.103.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.104.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.104.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.104.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.104.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.104.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.104.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.105.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.105.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.105.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.105.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.105.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.105.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.106.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.106.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.106.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.106.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.106.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.106.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.107.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.107.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.107.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.107.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.107.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.107.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.108.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.108.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.108.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.108.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.108.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.108.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.109.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.109.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.109.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.109.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.109.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.109.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.11.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.11.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.11.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.11.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.11.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.11.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.110.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.110.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.110.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.110.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.110.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.110.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.111.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.111.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.111.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.111.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.111.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.111.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.112.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.112.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.112.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.112.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.112.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.112.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.113.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.113.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.113.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.113.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.113.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.113.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.114.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.114.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.114.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.114.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.114.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.114.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.115.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.115.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.115.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.115.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.115.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.115.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.116.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.116.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.116.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.116.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.116.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.116.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.117.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.117.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.117.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.117.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.117.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.117.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.118.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.118.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.118.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.118.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.118.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.118.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.119.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.119.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.119.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.119.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.119.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.119.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.12.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.12.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.12.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.12.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.12.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.12.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.120.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.120.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.120.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.120.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.120.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.120.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.121.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.121.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.121.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.121.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.121.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.121.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.122.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.122.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.122.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.122.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.122.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.122.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.123.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.123.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.123.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.123.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.123.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.123.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.124.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.124.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.124.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.124.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.124.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.124.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.125.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.125.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.125.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.125.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.125.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.125.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.126.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.126.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.126.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.126.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.126.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.126.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.127.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.127.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.127.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.127.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.127.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.127.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.13.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.13.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.13.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.13.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.13.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.13.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.14.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.14.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.14.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.14.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.14.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.14.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.15.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.15.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.15.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.15.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.15.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.15.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.16.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.16.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.16.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.16.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.16.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.16.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.17.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.17.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.17.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.17.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.17.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.17.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.18.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.18.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.18.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.18.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.18.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.18.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.19.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.19.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.19.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.19.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.19.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.19.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.2.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.2.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.2.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.2.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.2.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.2.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.20.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.20.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.20.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.20.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.20.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.20.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.21.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.21.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.21.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.21.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.21.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.21.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.22.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.22.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.22.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.22.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.22.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.22.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.23.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.23.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.23.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.23.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.23.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.23.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.24.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.24.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.24.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.24.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.24.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.24.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.25.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.25.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.25.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.25.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.25.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.25.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.26.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.26.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.26.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.26.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.26.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.26.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.27.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.27.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.27.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.27.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.27.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.27.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.28.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.28.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.28.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.28.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.28.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.28.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.29.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.29.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.29.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.29.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.29.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.29.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.3.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.3.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.3.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.3.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.3.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.3.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.30.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.30.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.30.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.30.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.30.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.30.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.31.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.31.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.31.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.31.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.31.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.31.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.32.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.32.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.32.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.32.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.32.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.32.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.33.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.33.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.33.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.33.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.33.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.33.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.34.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.34.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.34.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.34.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.34.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.34.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.35.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.35.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.35.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.35.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.35.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.35.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.36.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.36.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.36.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.36.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.36.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.36.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.37.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.37.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.37.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.37.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.37.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.37.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.38.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.38.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.38.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.38.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.38.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.38.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.39.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.39.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.39.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.39.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.39.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.39.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.4.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.4.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.4.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.4.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.4.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.4.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.40.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.40.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.40.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.40.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.40.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.40.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.41.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.41.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.41.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.41.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.41.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.41.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.42.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.42.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.42.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.42.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.42.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.42.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.43.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.43.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.43.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.43.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.43.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.43.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.44.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.44.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.44.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.44.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.44.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.44.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.45.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.45.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.45.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.45.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.45.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.45.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.46.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.46.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.46.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.46.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.46.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.46.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.47.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.47.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.47.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.47.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.47.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.47.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.48.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.48.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.48.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.48.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.48.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.48.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.49.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.49.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.49.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.49.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.49.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.49.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.5.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.5.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.5.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.5.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.5.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.5.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.50.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.50.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.50.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.50.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.50.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.50.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.51.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.51.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.51.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.51.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.51.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.51.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.52.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.52.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.52.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.52.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.52.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.52.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.53.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.53.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.53.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.53.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.53.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.53.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.54.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.54.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.54.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.54.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.54.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.54.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.55.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.55.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.55.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.55.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.55.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.55.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.56.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.56.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.56.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.56.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.56.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.56.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.57.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.57.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.57.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.57.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.57.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.57.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.58.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.58.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.58.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.58.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.58.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.58.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.59.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.59.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.59.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.59.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.59.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.59.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.6.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.6.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.6.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.6.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.6.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.6.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.60.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.60.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.60.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.60.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.60.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.60.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.61.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.61.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.61.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.61.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.61.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.61.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.62.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.62.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.62.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.62.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.62.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.62.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.63.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.63.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.63.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.63.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.63.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.63.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.64.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.64.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.64.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.64.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.64.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.64.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.65.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.65.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.65.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.65.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.65.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.65.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.66.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.66.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.66.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.66.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.66.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.66.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.67.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.67.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.67.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.67.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.67.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.67.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.68.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.68.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.68.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.68.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.68.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.68.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.69.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.69.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.69.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.69.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.69.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.69.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.7.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.7.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.7.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.7.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.7.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.7.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.70.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.70.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.70.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.70.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.70.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.70.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.71.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.71.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.71.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.71.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.71.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.71.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.72.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.72.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.72.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.72.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.72.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.72.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.73.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.73.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.73.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.73.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.73.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.73.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.74.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.74.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.74.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.74.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.74.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.74.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.75.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.75.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.75.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.75.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.75.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.75.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.76.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.76.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.76.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.76.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.76.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.76.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.77.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.77.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.77.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.77.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.77.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.77.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.78.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.78.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.78.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.78.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.78.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.78.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.79.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.79.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.79.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.79.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.79.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.79.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.8.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.8.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.8.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.8.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.8.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.8.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.80.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.80.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.80.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.80.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.80.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.80.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.81.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.81.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.81.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.81.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.81.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.81.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.82.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.82.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.82.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.82.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.82.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.82.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.83.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.83.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.83.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.83.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.83.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.83.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.84.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.84.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.84.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.84.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.84.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.84.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.85.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.85.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.85.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.85.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.85.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.85.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.86.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.86.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.86.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.86.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.86.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.86.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.87.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.87.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.87.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.87.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.87.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.87.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.88.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.88.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.88.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.88.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.88.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.88.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.89.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.89.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.89.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.89.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.89.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.89.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.9.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.9.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.9.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.9.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.9.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.9.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.90.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.90.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.90.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.90.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.90.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.90.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.91.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.91.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.91.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.91.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.91.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.91.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.92.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.92.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.92.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.92.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.92.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.92.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.93.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.93.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.93.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.93.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.93.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.93.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.94.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.94.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.94.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.94.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.94.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.94.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.95.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.95.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.95.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.95.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.95.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.95.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.96.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.96.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.96.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.96.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.96.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.96.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.97.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.97.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.97.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.97.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.97.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.97.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.98.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.98.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.98.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.98.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.98.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.98.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.99.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.99.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.99.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.99.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.99.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.experts.99.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.gate.e_score_correction_bias": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.gate.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.shared_experts.down_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.shared_experts.down_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.shared_experts.gate_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.shared_experts.gate_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.shared_experts.up_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.mlp.shared_experts.up_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.post_attention_layernorm.weight": "model-00015-of-00047.safetensors", + "model.layers.14.self_attn.k_proj.bias": "model-00015-of-00047.safetensors", + "model.layers.14.self_attn.k_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.self_attn.k_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.self_attn.o_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.self_attn.o_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.self_attn.q_proj.bias": "model-00015-of-00047.safetensors", + "model.layers.14.self_attn.q_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.self_attn.q_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.14.self_attn.v_proj.bias": "model-00015-of-00047.safetensors", + "model.layers.14.self_attn.v_proj.weight": "model-00015-of-00047.safetensors", + "model.layers.14.self_attn.v_proj.weight_scale": "model-00015-of-00047.safetensors", + "model.layers.15.input_layernorm.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.0.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.0.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.0.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.0.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.0.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.0.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.1.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.1.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.1.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.1.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.1.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.1.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.10.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.10.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.10.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.10.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.10.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.10.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.100.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.100.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.100.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.100.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.100.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.100.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.101.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.101.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.101.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.101.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.101.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.101.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.102.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.102.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.102.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.102.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.102.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.102.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.103.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.103.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.103.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.103.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.103.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.103.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.104.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.104.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.104.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.104.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.104.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.104.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.105.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.105.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.105.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.105.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.105.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.105.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.106.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.106.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.106.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.106.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.106.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.106.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.107.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.107.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.107.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.107.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.107.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.107.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.108.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.108.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.108.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.108.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.108.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.108.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.109.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.109.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.109.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.109.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.109.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.109.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.11.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.11.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.11.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.11.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.11.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.11.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.110.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.110.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.110.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.110.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.110.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.110.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.111.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.111.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.111.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.111.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.111.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.111.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.112.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.112.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.112.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.112.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.112.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.112.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.113.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.113.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.113.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.113.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.113.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.113.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.114.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.114.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.114.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.114.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.114.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.114.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.115.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.115.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.115.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.115.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.115.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.115.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.116.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.116.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.116.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.116.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.116.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.116.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.117.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.117.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.117.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.117.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.117.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.117.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.118.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.118.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.118.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.118.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.118.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.118.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.119.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.119.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.119.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.119.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.119.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.119.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.12.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.12.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.12.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.12.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.12.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.12.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.120.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.120.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.120.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.120.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.120.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.120.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.121.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.121.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.121.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.121.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.121.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.121.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.122.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.122.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.122.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.122.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.122.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.122.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.123.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.123.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.123.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.123.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.123.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.123.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.124.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.124.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.124.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.124.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.124.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.124.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.125.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.125.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.125.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.125.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.125.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.125.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.126.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.126.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.126.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.126.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.126.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.126.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.127.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.127.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.127.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.127.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.127.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.127.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.13.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.13.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.13.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.13.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.13.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.13.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.14.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.14.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.14.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.14.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.14.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.14.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.15.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.15.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.15.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.15.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.15.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.15.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.16.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.16.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.16.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.16.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.16.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.16.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.17.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.17.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.17.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.17.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.17.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.17.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.18.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.18.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.18.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.18.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.18.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.18.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.19.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.19.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.19.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.19.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.19.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.19.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.2.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.2.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.2.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.2.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.2.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.2.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.20.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.20.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.20.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.20.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.20.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.20.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.21.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.21.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.21.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.21.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.21.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.21.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.22.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.22.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.22.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.22.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.22.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.22.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.23.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.23.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.23.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.23.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.23.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.23.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.24.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.24.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.24.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.24.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.24.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.24.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.25.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.25.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.25.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.25.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.25.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.25.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.26.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.26.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.26.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.26.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.26.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.26.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.27.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.27.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.27.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.27.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.27.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.27.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.28.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.28.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.28.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.28.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.28.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.28.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.29.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.29.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.29.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.29.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.29.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.29.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.3.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.3.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.3.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.3.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.3.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.3.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.30.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.30.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.30.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.30.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.30.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.30.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.31.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.31.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.31.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.31.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.31.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.31.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.32.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.32.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.32.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.32.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.32.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.32.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.33.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.33.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.33.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.33.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.33.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.33.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.34.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.34.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.34.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.34.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.34.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.34.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.35.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.35.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.35.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.35.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.35.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.35.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.36.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.36.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.36.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.36.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.36.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.36.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.37.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.37.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.37.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.37.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.37.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.37.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.38.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.38.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.38.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.38.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.38.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.38.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.39.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.39.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.39.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.39.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.39.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.39.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.4.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.4.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.4.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.4.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.4.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.4.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.40.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.40.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.40.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.40.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.40.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.40.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.41.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.41.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.41.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.41.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.41.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.41.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.42.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.42.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.42.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.42.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.42.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.42.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.43.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.43.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.43.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.43.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.43.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.43.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.44.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.44.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.44.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.44.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.44.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.44.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.45.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.45.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.45.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.45.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.45.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.45.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.46.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.46.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.46.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.46.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.46.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.46.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.47.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.47.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.47.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.47.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.47.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.47.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.48.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.48.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.48.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.48.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.48.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.48.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.49.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.49.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.49.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.49.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.49.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.49.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.5.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.5.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.5.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.5.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.5.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.5.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.50.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.50.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.50.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.50.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.50.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.50.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.51.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.51.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.51.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.51.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.51.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.51.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.52.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.52.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.52.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.52.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.52.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.52.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.53.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.53.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.53.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.53.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.53.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.53.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.54.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.54.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.54.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.54.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.54.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.54.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.55.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.55.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.55.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.55.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.55.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.55.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.56.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.56.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.56.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.56.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.56.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.56.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.57.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.57.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.57.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.57.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.57.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.57.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.58.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.58.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.58.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.58.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.58.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.58.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.59.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.59.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.59.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.59.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.59.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.59.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.6.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.6.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.6.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.6.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.6.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.6.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.60.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.60.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.60.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.60.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.60.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.60.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.61.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.61.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.61.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.61.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.61.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.61.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.62.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.62.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.62.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.62.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.62.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.62.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.63.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.63.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.63.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.63.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.63.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.63.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.64.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.64.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.64.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.64.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.64.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.64.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.65.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.65.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.65.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.65.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.65.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.65.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.66.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.66.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.66.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.66.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.66.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.66.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.67.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.67.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.67.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.67.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.67.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.67.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.68.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.68.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.68.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.68.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.68.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.68.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.69.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.69.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.69.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.69.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.69.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.69.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.7.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.7.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.7.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.7.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.7.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.7.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.70.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.70.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.70.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.70.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.70.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.70.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.71.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.71.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.71.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.71.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.71.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.71.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.72.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.72.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.72.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.72.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.72.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.72.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.73.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.73.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.73.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.73.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.73.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.73.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.74.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.74.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.74.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.74.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.74.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.74.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.75.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.75.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.75.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.75.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.75.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.75.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.76.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.76.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.76.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.76.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.76.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.76.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.77.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.77.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.77.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.77.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.77.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.77.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.78.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.78.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.78.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.78.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.78.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.78.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.79.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.79.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.79.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.79.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.79.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.79.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.8.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.8.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.8.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.8.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.8.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.8.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.80.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.80.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.80.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.80.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.80.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.80.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.81.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.81.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.81.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.81.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.81.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.81.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.82.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.82.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.82.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.82.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.82.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.82.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.83.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.83.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.83.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.83.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.83.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.83.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.84.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.84.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.84.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.84.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.84.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.84.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.85.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.85.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.85.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.85.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.85.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.85.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.86.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.86.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.86.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.86.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.86.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.86.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.87.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.87.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.87.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.87.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.87.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.87.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.88.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.88.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.88.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.88.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.88.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.88.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.89.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.89.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.89.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.89.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.89.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.89.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.9.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.9.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.9.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.9.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.9.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.9.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.90.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.90.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.90.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.90.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.90.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.90.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.91.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.91.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.91.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.91.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.91.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.91.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.92.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.92.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.92.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.92.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.92.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.92.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.93.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.93.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.93.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.93.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.93.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.93.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.94.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.94.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.94.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.94.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.94.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.94.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.95.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.95.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.95.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.95.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.95.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.95.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.96.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.96.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.96.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.96.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.96.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.96.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.97.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.97.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.97.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.97.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.97.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.97.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.98.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.98.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.98.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.98.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.98.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.98.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.99.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.99.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.99.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.99.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.99.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.experts.99.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.gate.e_score_correction_bias": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.gate.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.shared_experts.down_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.shared_experts.down_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.shared_experts.gate_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.shared_experts.gate_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.shared_experts.up_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.mlp.shared_experts.up_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.post_attention_layernorm.weight": "model-00016-of-00047.safetensors", + "model.layers.15.self_attn.k_proj.bias": "model-00016-of-00047.safetensors", + "model.layers.15.self_attn.k_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.self_attn.k_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.self_attn.o_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.self_attn.o_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.self_attn.q_proj.bias": "model-00016-of-00047.safetensors", + "model.layers.15.self_attn.q_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.self_attn.q_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.15.self_attn.v_proj.bias": "model-00016-of-00047.safetensors", + "model.layers.15.self_attn.v_proj.weight": "model-00016-of-00047.safetensors", + "model.layers.15.self_attn.v_proj.weight_scale": "model-00016-of-00047.safetensors", + "model.layers.16.input_layernorm.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.0.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.0.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.0.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.0.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.0.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.0.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.1.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.1.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.1.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.1.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.1.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.1.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.10.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.10.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.10.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.10.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.10.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.10.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.100.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.100.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.100.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.100.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.100.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.100.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.101.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.101.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.101.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.101.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.101.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.101.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.102.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.102.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.102.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.102.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.102.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.102.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.103.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.103.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.103.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.103.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.103.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.103.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.104.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.104.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.104.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.104.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.104.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.104.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.105.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.105.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.105.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.105.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.105.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.105.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.106.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.106.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.106.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.106.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.106.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.106.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.107.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.107.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.107.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.107.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.107.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.107.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.108.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.108.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.108.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.108.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.108.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.108.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.109.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.109.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.109.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.109.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.109.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.109.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.11.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.11.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.11.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.11.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.11.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.11.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.110.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.110.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.110.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.110.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.110.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.110.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.111.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.111.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.111.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.111.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.111.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.111.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.112.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.112.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.112.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.112.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.112.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.112.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.113.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.113.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.113.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.113.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.113.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.113.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.114.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.114.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.114.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.114.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.114.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.114.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.115.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.115.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.115.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.115.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.115.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.115.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.116.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.116.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.116.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.116.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.116.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.116.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.117.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.117.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.117.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.117.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.117.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.117.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.118.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.118.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.118.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.118.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.118.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.118.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.119.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.119.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.119.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.119.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.119.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.119.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.12.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.12.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.12.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.12.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.12.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.12.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.120.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.120.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.120.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.120.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.120.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.120.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.121.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.121.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.121.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.121.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.121.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.121.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.122.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.122.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.122.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.122.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.122.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.122.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.123.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.123.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.123.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.123.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.123.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.123.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.124.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.124.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.124.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.124.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.124.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.124.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.125.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.125.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.125.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.125.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.125.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.125.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.126.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.126.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.126.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.126.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.126.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.126.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.127.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.127.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.127.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.127.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.127.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.127.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.13.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.13.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.13.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.13.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.13.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.13.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.14.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.14.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.14.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.14.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.14.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.14.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.15.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.15.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.15.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.15.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.15.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.15.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.16.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.16.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.16.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.16.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.16.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.16.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.17.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.17.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.17.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.17.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.17.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.17.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.18.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.18.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.18.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.18.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.18.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.18.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.19.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.19.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.19.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.19.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.19.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.19.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.2.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.2.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.2.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.2.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.2.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.2.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.20.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.20.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.20.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.20.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.20.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.20.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.21.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.21.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.21.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.21.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.21.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.21.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.22.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.22.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.22.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.22.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.22.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.22.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.23.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.23.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.23.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.23.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.23.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.23.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.24.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.24.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.24.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.24.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.24.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.24.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.25.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.25.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.25.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.25.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.25.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.25.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.26.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.26.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.26.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.26.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.26.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.26.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.27.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.27.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.27.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.27.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.27.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.27.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.28.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.28.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.28.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.28.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.28.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.28.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.29.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.29.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.29.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.29.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.29.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.29.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.3.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.3.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.3.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.3.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.3.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.3.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.30.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.30.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.30.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.30.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.30.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.30.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.31.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.31.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.31.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.31.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.31.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.31.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.32.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.32.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.32.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.32.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.32.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.32.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.33.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.33.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.33.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.33.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.33.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.33.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.34.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.34.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.34.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.34.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.34.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.34.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.35.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.35.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.35.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.35.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.35.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.35.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.36.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.36.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.36.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.36.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.36.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.36.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.37.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.37.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.37.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.37.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.37.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.37.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.38.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.38.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.38.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.38.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.38.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.38.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.39.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.39.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.39.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.39.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.39.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.39.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.4.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.4.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.4.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.4.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.4.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.4.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.40.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.40.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.40.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.40.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.40.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.40.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.41.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.41.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.41.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.41.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.41.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.41.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.42.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.42.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.42.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.42.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.42.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.42.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.43.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.43.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.43.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.43.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.43.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.43.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.44.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.44.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.44.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.44.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.44.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.44.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.45.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.45.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.45.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.45.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.45.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.45.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.46.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.46.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.46.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.46.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.46.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.46.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.47.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.47.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.47.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.47.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.47.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.47.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.48.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.48.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.48.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.48.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.48.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.48.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.49.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.49.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.49.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.49.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.49.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.49.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.5.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.5.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.5.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.5.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.5.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.5.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.50.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.50.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.50.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.50.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.50.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.50.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.51.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.51.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.51.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.51.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.51.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.51.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.52.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.52.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.52.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.52.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.52.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.52.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.53.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.53.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.53.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.53.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.53.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.53.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.54.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.54.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.54.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.54.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.54.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.54.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.55.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.55.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.55.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.55.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.55.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.55.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.56.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.56.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.56.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.56.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.56.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.56.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.57.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.57.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.57.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.57.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.57.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.57.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.58.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.58.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.58.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.58.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.58.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.58.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.59.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.59.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.59.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.59.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.59.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.59.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.6.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.6.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.6.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.6.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.6.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.6.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.60.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.60.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.60.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.60.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.60.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.60.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.61.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.61.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.61.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.61.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.61.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.61.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.62.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.62.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.62.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.62.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.62.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.62.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.63.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.63.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.63.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.63.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.63.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.63.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.64.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.64.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.64.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.64.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.64.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.64.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.65.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.65.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.65.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.65.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.65.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.65.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.66.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.66.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.66.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.66.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.66.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.66.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.67.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.67.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.67.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.67.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.67.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.67.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.68.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.68.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.68.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.68.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.68.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.68.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.69.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.69.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.69.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.69.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.69.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.69.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.7.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.7.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.7.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.7.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.7.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.7.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.70.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.70.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.70.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.70.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.70.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.70.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.71.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.71.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.71.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.71.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.71.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.71.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.72.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.72.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.72.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.72.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.72.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.72.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.73.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.73.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.73.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.73.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.73.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.73.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.74.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.74.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.74.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.74.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.74.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.74.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.75.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.75.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.75.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.75.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.75.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.75.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.76.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.76.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.76.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.76.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.76.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.76.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.77.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.77.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.77.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.77.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.77.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.77.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.78.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.78.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.78.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.78.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.78.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.78.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.79.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.79.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.79.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.79.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.79.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.79.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.8.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.8.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.8.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.8.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.8.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.8.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.80.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.80.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.80.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.80.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.80.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.80.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.81.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.81.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.81.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.81.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.81.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.81.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.82.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.82.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.82.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.82.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.82.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.82.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.83.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.83.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.83.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.83.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.83.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.83.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.84.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.84.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.84.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.84.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.84.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.84.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.85.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.85.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.85.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.85.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.85.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.85.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.86.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.86.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.86.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.86.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.86.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.86.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.87.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.87.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.87.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.87.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.87.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.87.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.88.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.88.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.88.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.88.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.88.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.88.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.89.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.89.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.89.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.89.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.89.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.89.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.9.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.9.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.9.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.9.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.9.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.9.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.90.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.90.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.90.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.90.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.90.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.90.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.91.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.91.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.91.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.91.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.91.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.91.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.92.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.92.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.92.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.92.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.92.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.92.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.93.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.93.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.93.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.93.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.93.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.93.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.94.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.94.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.94.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.94.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.94.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.94.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.95.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.95.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.95.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.95.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.95.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.95.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.96.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.96.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.96.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.96.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.96.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.96.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.97.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.97.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.97.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.97.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.97.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.97.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.98.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.98.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.98.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.98.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.98.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.98.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.99.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.99.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.99.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.99.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.99.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.experts.99.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.gate.e_score_correction_bias": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.gate.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.shared_experts.down_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.shared_experts.down_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.shared_experts.gate_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.shared_experts.gate_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.shared_experts.up_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.mlp.shared_experts.up_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.post_attention_layernorm.weight": "model-00017-of-00047.safetensors", + "model.layers.16.self_attn.k_proj.bias": "model-00017-of-00047.safetensors", + "model.layers.16.self_attn.k_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.self_attn.k_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.self_attn.o_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.self_attn.o_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.self_attn.q_proj.bias": "model-00017-of-00047.safetensors", + "model.layers.16.self_attn.q_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.self_attn.q_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.16.self_attn.v_proj.bias": "model-00017-of-00047.safetensors", + "model.layers.16.self_attn.v_proj.weight": "model-00017-of-00047.safetensors", + "model.layers.16.self_attn.v_proj.weight_scale": "model-00017-of-00047.safetensors", + "model.layers.17.input_layernorm.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.0.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.0.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.0.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.0.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.0.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.0.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.1.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.1.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.1.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.1.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.1.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.1.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.10.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.10.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.10.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.10.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.10.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.10.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.100.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.100.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.100.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.100.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.100.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.100.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.101.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.101.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.101.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.101.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.101.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.101.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.102.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.102.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.102.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.102.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.102.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.102.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.103.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.103.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.103.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.103.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.103.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.103.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.104.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.104.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.104.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.104.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.104.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.104.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.105.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.105.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.105.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.105.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.105.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.105.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.106.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.106.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.106.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.106.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.106.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.106.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.107.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.107.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.107.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.107.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.107.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.107.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.108.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.108.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.108.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.108.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.108.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.108.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.109.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.109.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.109.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.109.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.109.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.109.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.11.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.11.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.11.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.11.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.11.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.11.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.110.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.110.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.110.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.110.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.110.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.110.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.111.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.111.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.111.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.111.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.111.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.111.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.112.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.112.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.112.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.112.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.112.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.112.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.113.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.113.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.113.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.113.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.113.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.113.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.114.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.114.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.114.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.114.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.114.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.114.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.115.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.115.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.115.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.115.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.115.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.115.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.116.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.116.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.116.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.116.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.116.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.116.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.117.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.117.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.117.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.117.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.117.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.117.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.118.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.118.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.118.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.118.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.118.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.118.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.119.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.119.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.119.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.119.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.119.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.119.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.12.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.12.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.12.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.12.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.12.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.12.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.120.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.120.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.120.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.120.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.120.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.120.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.121.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.121.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.121.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.121.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.121.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.121.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.122.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.122.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.122.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.122.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.122.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.122.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.123.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.123.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.123.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.123.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.123.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.123.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.124.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.124.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.124.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.124.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.124.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.124.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.125.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.125.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.125.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.125.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.125.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.125.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.126.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.126.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.126.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.126.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.126.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.126.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.127.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.127.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.127.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.127.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.127.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.127.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.13.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.13.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.13.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.13.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.13.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.13.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.14.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.14.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.14.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.14.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.14.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.14.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.15.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.15.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.15.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.15.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.15.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.15.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.16.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.16.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.16.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.16.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.16.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.16.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.17.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.17.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.17.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.17.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.17.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.17.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.18.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.18.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.18.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.18.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.18.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.18.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.19.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.19.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.19.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.19.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.19.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.19.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.2.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.2.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.2.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.2.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.2.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.2.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.20.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.20.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.20.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.20.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.20.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.20.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.21.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.21.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.21.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.21.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.21.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.21.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.22.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.22.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.22.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.22.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.22.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.22.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.23.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.23.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.23.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.23.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.23.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.23.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.24.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.24.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.24.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.24.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.24.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.24.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.25.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.25.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.25.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.25.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.25.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.25.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.26.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.26.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.26.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.26.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.26.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.26.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.27.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.27.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.27.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.27.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.27.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.27.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.28.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.28.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.28.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.28.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.28.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.28.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.29.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.29.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.29.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.29.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.29.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.29.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.3.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.3.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.3.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.3.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.3.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.3.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.30.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.30.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.30.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.30.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.30.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.30.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.31.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.31.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.31.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.31.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.31.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.31.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.32.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.32.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.32.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.32.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.32.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.32.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.33.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.33.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.33.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.33.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.33.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.33.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.34.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.34.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.34.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.34.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.34.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.34.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.35.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.35.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.35.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.35.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.35.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.35.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.36.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.36.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.36.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.36.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.36.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.36.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.37.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.37.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.37.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.37.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.37.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.37.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.38.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.38.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.38.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.38.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.38.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.38.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.39.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.39.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.39.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.39.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.39.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.39.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.4.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.4.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.4.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.4.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.4.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.4.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.40.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.40.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.40.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.40.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.40.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.40.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.41.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.41.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.41.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.41.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.41.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.41.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.42.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.42.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.42.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.42.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.42.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.42.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.43.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.43.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.43.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.43.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.43.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.43.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.44.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.44.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.44.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.44.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.44.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.44.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.45.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.45.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.45.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.45.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.45.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.45.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.46.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.46.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.46.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.46.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.46.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.46.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.47.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.47.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.47.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.47.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.47.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.47.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.48.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.48.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.48.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.48.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.48.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.48.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.49.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.49.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.49.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.49.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.49.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.49.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.5.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.5.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.5.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.5.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.5.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.5.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.50.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.50.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.50.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.50.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.50.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.50.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.51.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.51.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.51.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.51.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.51.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.51.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.52.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.52.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.52.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.52.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.52.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.52.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.53.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.53.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.53.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.53.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.53.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.53.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.54.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.54.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.54.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.54.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.54.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.54.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.55.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.55.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.55.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.55.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.55.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.55.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.56.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.56.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.56.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.56.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.56.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.56.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.57.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.57.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.57.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.57.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.57.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.57.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.58.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.58.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.58.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.58.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.58.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.58.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.59.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.59.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.59.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.59.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.59.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.59.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.6.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.6.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.6.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.6.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.6.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.6.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.60.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.60.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.60.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.60.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.60.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.60.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.61.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.61.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.61.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.61.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.61.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.61.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.62.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.62.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.62.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.62.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.62.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.62.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.63.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.63.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.63.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.63.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.63.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.63.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.64.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.64.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.64.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.64.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.64.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.64.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.65.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.65.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.65.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.65.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.65.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.65.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.66.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.66.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.66.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.66.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.66.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.66.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.67.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.67.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.67.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.67.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.67.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.67.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.68.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.68.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.68.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.68.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.68.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.68.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.69.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.69.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.69.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.69.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.69.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.69.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.7.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.7.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.7.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.7.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.7.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.7.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.70.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.70.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.70.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.70.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.70.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.70.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.71.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.71.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.71.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.71.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.71.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.71.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.72.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.72.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.72.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.72.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.72.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.72.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.73.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.73.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.73.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.73.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.73.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.73.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.74.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.74.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.74.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.74.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.74.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.74.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.75.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.75.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.75.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.75.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.75.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.75.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.76.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.76.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.76.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.76.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.76.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.76.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.77.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.77.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.77.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.77.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.77.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.77.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.78.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.78.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.78.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.78.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.78.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.78.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.79.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.79.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.79.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.79.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.79.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.79.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.8.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.8.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.8.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.8.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.8.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.8.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.80.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.80.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.80.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.80.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.80.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.80.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.81.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.81.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.81.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.81.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.81.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.81.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.82.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.82.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.82.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.82.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.82.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.82.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.83.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.83.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.83.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.83.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.83.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.83.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.84.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.84.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.84.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.84.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.84.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.84.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.85.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.85.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.85.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.85.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.85.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.85.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.86.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.86.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.86.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.86.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.86.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.86.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.87.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.87.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.87.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.87.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.87.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.87.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.88.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.88.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.88.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.88.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.88.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.88.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.89.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.89.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.89.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.89.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.89.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.89.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.9.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.9.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.9.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.9.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.9.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.9.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.90.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.90.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.90.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.90.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.90.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.90.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.91.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.91.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.91.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.91.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.91.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.91.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.92.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.92.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.92.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.92.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.92.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.92.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.93.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.93.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.93.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.93.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.93.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.93.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.94.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.94.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.94.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.94.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.94.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.94.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.95.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.95.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.95.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.95.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.95.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.95.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.96.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.96.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.96.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.96.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.96.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.96.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.97.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.97.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.97.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.97.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.97.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.97.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.98.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.98.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.98.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.98.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.98.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.98.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.99.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.99.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.99.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.99.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.99.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.experts.99.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.gate.e_score_correction_bias": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.gate.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.shared_experts.down_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.shared_experts.down_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.shared_experts.gate_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.shared_experts.gate_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.shared_experts.up_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.mlp.shared_experts.up_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.post_attention_layernorm.weight": "model-00018-of-00047.safetensors", + "model.layers.17.self_attn.k_proj.bias": "model-00018-of-00047.safetensors", + "model.layers.17.self_attn.k_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.self_attn.k_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.self_attn.o_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.self_attn.o_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.self_attn.q_proj.bias": "model-00018-of-00047.safetensors", + "model.layers.17.self_attn.q_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.self_attn.q_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.17.self_attn.v_proj.bias": "model-00018-of-00047.safetensors", + "model.layers.17.self_attn.v_proj.weight": "model-00018-of-00047.safetensors", + "model.layers.17.self_attn.v_proj.weight_scale": "model-00018-of-00047.safetensors", + "model.layers.18.input_layernorm.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.0.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.0.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.0.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.0.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.0.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.0.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.1.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.1.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.1.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.1.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.1.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.1.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.10.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.10.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.10.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.10.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.10.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.10.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.100.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.100.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.100.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.100.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.100.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.100.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.101.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.101.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.101.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.101.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.101.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.101.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.102.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.102.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.102.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.102.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.102.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.102.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.103.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.103.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.103.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.103.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.103.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.103.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.104.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.104.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.104.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.104.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.104.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.104.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.105.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.105.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.105.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.105.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.105.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.105.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.106.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.106.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.106.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.106.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.106.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.106.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.107.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.107.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.107.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.107.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.107.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.107.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.108.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.108.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.108.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.108.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.108.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.108.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.109.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.109.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.109.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.109.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.109.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.109.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.11.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.11.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.11.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.11.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.11.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.11.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.110.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.110.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.110.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.110.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.110.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.110.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.111.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.111.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.111.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.111.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.111.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.111.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.112.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.112.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.112.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.112.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.112.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.112.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.113.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.113.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.113.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.113.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.113.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.113.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.114.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.114.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.114.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.114.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.114.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.114.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.115.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.115.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.115.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.115.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.115.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.115.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.116.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.116.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.116.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.116.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.116.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.116.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.117.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.117.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.117.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.117.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.117.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.117.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.118.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.118.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.118.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.118.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.118.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.118.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.119.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.119.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.119.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.119.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.119.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.119.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.12.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.12.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.12.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.12.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.12.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.12.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.120.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.120.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.120.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.120.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.120.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.120.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.121.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.121.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.121.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.121.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.121.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.121.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.122.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.122.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.122.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.122.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.122.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.122.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.123.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.123.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.123.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.123.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.123.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.123.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.124.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.124.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.124.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.124.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.124.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.124.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.125.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.125.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.125.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.125.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.125.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.125.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.126.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.126.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.126.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.126.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.126.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.126.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.127.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.127.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.127.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.127.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.127.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.127.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.13.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.13.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.13.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.13.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.13.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.13.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.14.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.14.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.14.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.14.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.14.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.14.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.15.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.15.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.15.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.15.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.15.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.15.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.16.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.16.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.16.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.16.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.16.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.16.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.17.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.17.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.17.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.17.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.17.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.17.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.18.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.18.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.18.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.18.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.18.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.18.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.19.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.19.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.19.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.19.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.19.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.19.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.2.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.2.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.2.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.2.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.2.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.2.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.20.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.20.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.20.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.20.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.20.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.20.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.21.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.21.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.21.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.21.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.21.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.21.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.22.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.22.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.22.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.22.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.22.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.22.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.23.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.23.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.23.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.23.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.23.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.23.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.24.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.24.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.24.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.24.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.24.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.24.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.25.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.25.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.25.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.25.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.25.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.25.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.26.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.26.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.26.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.26.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.26.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.26.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.27.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.27.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.27.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.27.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.27.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.27.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.28.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.28.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.28.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.28.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.28.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.28.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.29.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.29.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.29.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.29.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.29.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.29.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.3.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.3.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.3.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.3.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.3.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.3.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.30.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.30.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.30.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.30.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.30.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.30.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.31.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.31.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.31.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.31.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.31.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.31.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.32.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.32.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.32.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.32.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.32.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.32.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.33.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.33.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.33.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.33.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.33.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.33.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.34.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.34.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.34.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.34.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.34.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.34.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.35.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.35.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.35.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.35.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.35.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.35.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.36.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.36.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.36.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.36.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.36.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.36.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.37.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.37.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.37.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.37.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.37.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.37.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.38.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.38.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.38.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.38.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.38.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.38.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.39.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.39.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.39.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.39.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.39.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.39.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.4.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.4.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.4.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.4.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.4.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.4.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.40.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.40.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.40.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.40.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.40.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.40.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.41.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.41.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.41.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.41.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.41.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.41.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.42.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.42.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.42.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.42.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.42.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.42.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.43.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.43.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.43.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.43.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.43.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.43.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.44.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.44.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.44.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.44.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.44.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.44.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.45.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.45.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.45.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.45.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.45.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.45.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.46.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.46.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.46.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.46.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.46.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.46.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.47.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.47.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.47.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.47.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.47.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.47.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.48.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.48.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.48.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.48.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.48.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.48.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.49.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.49.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.49.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.49.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.49.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.49.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.5.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.5.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.5.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.5.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.5.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.5.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.50.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.50.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.50.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.50.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.50.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.50.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.51.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.51.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.51.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.51.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.51.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.51.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.52.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.52.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.52.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.52.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.52.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.52.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.53.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.53.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.53.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.53.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.53.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.53.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.54.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.54.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.54.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.54.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.54.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.54.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.55.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.55.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.55.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.55.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.55.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.55.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.56.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.56.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.56.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.56.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.56.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.56.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.57.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.57.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.57.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.57.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.57.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.57.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.58.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.58.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.58.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.58.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.58.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.58.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.59.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.59.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.59.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.59.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.59.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.59.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.6.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.6.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.6.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.6.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.6.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.6.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.60.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.60.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.60.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.60.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.60.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.60.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.61.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.61.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.61.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.61.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.61.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.61.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.62.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.62.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.62.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.62.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.62.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.62.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.63.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.63.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.63.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.63.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.63.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.63.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.64.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.64.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.64.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.64.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.64.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.64.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.65.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.65.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.65.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.65.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.65.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.65.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.66.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.66.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.66.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.66.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.66.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.66.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.67.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.67.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.67.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.67.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.67.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.67.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.68.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.68.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.68.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.68.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.68.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.68.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.69.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.69.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.69.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.69.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.69.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.69.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.7.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.7.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.7.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.7.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.7.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.7.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.70.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.70.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.70.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.70.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.70.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.70.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.71.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.71.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.71.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.71.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.71.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.71.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.72.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.72.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.72.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.72.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.72.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.72.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.73.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.73.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.73.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.73.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.73.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.73.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.74.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.74.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.74.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.74.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.74.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.74.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.75.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.75.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.75.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.75.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.75.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.75.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.76.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.76.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.76.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.76.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.76.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.76.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.77.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.77.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.77.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.77.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.77.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.77.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.78.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.78.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.78.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.78.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.78.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.78.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.79.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.79.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.79.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.79.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.79.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.79.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.8.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.8.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.8.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.8.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.8.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.8.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.80.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.80.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.80.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.80.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.80.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.80.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.81.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.81.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.81.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.81.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.81.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.81.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.82.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.82.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.82.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.82.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.82.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.82.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.83.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.83.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.83.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.83.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.83.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.83.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.84.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.84.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.84.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.84.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.84.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.84.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.85.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.85.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.85.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.85.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.85.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.85.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.86.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.86.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.86.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.86.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.86.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.86.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.87.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.87.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.87.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.87.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.87.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.87.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.88.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.88.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.88.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.88.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.88.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.88.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.89.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.89.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.89.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.89.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.89.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.89.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.9.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.9.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.9.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.9.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.9.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.9.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.90.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.90.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.90.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.90.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.90.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.90.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.91.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.91.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.91.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.91.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.91.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.91.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.92.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.92.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.92.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.92.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.92.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.92.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.93.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.93.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.93.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.93.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.93.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.93.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.94.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.94.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.94.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.94.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.94.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.94.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.95.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.95.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.95.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.95.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.95.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.95.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.96.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.96.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.96.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.96.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.96.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.96.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.97.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.97.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.97.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.97.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.97.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.97.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.98.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.98.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.98.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.98.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.98.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.98.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.99.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.99.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.99.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.99.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.99.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.experts.99.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.gate.e_score_correction_bias": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.gate.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.shared_experts.down_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.shared_experts.down_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.shared_experts.gate_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.shared_experts.gate_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.shared_experts.up_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.mlp.shared_experts.up_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.post_attention_layernorm.weight": "model-00019-of-00047.safetensors", + "model.layers.18.self_attn.k_proj.bias": "model-00019-of-00047.safetensors", + "model.layers.18.self_attn.k_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.self_attn.k_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.self_attn.o_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.self_attn.o_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.self_attn.q_proj.bias": "model-00019-of-00047.safetensors", + "model.layers.18.self_attn.q_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.self_attn.q_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.18.self_attn.v_proj.bias": "model-00019-of-00047.safetensors", + "model.layers.18.self_attn.v_proj.weight": "model-00019-of-00047.safetensors", + "model.layers.18.self_attn.v_proj.weight_scale": "model-00019-of-00047.safetensors", + "model.layers.19.input_layernorm.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.0.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.0.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.0.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.0.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.0.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.0.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.1.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.1.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.1.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.1.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.1.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.1.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.10.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.10.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.10.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.10.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.10.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.10.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.100.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.100.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.100.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.100.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.100.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.100.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.101.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.101.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.101.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.101.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.101.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.101.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.102.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.102.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.102.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.102.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.102.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.102.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.103.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.103.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.103.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.103.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.103.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.103.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.104.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.104.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.104.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.104.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.104.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.104.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.105.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.105.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.105.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.105.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.105.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.105.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.106.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.106.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.106.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.106.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.106.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.106.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.107.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.107.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.107.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.107.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.107.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.107.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.108.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.108.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.108.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.108.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.108.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.108.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.109.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.109.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.109.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.109.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.109.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.109.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.11.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.11.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.11.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.11.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.11.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.11.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.110.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.110.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.110.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.110.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.110.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.110.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.111.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.111.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.111.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.111.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.111.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.111.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.112.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.112.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.112.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.112.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.112.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.112.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.113.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.113.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.113.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.113.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.113.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.113.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.114.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.114.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.114.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.114.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.114.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.114.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.115.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.115.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.115.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.115.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.115.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.115.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.116.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.116.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.116.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.116.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.116.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.116.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.117.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.117.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.117.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.117.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.117.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.117.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.118.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.118.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.118.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.118.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.118.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.118.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.119.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.119.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.119.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.119.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.119.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.119.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.12.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.12.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.12.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.12.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.12.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.12.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.120.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.120.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.120.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.120.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.120.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.120.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.121.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.121.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.121.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.121.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.121.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.121.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.122.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.122.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.122.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.122.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.122.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.122.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.123.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.123.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.123.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.123.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.123.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.123.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.124.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.124.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.124.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.124.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.124.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.124.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.125.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.125.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.125.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.125.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.125.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.125.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.126.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.126.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.126.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.126.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.126.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.126.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.127.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.127.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.127.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.127.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.127.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.127.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.13.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.13.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.13.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.13.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.13.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.13.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.14.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.14.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.14.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.14.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.14.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.14.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.15.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.15.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.15.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.15.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.15.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.15.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.16.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.16.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.16.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.16.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.16.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.16.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.17.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.17.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.17.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.17.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.17.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.17.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.18.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.18.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.18.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.18.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.18.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.18.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.19.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.19.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.19.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.19.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.19.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.19.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.2.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.2.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.2.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.2.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.2.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.2.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.20.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.20.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.20.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.20.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.20.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.20.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.21.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.21.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.21.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.21.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.21.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.21.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.22.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.22.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.22.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.22.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.22.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.22.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.23.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.23.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.23.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.23.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.23.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.23.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.24.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.24.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.24.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.24.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.24.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.24.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.25.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.25.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.25.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.25.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.25.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.25.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.26.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.26.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.26.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.26.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.26.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.26.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.27.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.27.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.27.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.27.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.27.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.27.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.28.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.28.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.28.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.28.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.28.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.28.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.29.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.29.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.29.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.29.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.29.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.29.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.3.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.3.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.3.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.3.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.3.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.3.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.30.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.30.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.30.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.30.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.30.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.30.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.31.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.31.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.31.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.31.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.31.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.31.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.32.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.32.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.32.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.32.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.32.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.32.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.33.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.33.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.33.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.33.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.33.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.33.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.34.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.34.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.34.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.34.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.34.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.34.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.35.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.35.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.35.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.35.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.35.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.35.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.36.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.36.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.36.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.36.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.36.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.36.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.37.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.37.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.37.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.37.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.37.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.37.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.38.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.38.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.38.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.38.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.38.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.38.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.39.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.39.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.39.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.39.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.39.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.39.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.4.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.4.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.4.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.4.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.4.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.4.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.40.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.40.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.40.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.40.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.40.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.40.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.41.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.41.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.41.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.41.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.41.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.41.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.42.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.42.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.42.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.42.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.42.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.42.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.43.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.43.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.43.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.43.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.43.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.43.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.44.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.44.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.44.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.44.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.44.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.44.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.45.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.45.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.45.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.45.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.45.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.45.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.46.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.46.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.46.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.46.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.46.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.46.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.47.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.47.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.47.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.47.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.47.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.47.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.48.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.48.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.48.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.48.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.48.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.48.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.49.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.49.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.49.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.49.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.49.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.49.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.5.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.5.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.5.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.5.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.5.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.5.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.50.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.50.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.50.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.50.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.50.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.50.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.51.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.51.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.51.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.51.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.51.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.51.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.52.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.52.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.52.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.52.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.52.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.52.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.53.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.53.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.53.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.53.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.53.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.53.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.54.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.54.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.54.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.54.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.54.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.54.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.55.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.55.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.55.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.55.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.55.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.55.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.56.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.56.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.56.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.56.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.56.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.56.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.57.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.57.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.57.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.57.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.57.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.57.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.58.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.58.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.58.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.58.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.58.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.58.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.59.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.59.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.59.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.59.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.59.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.59.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.6.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.6.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.6.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.6.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.6.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.6.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.60.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.60.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.60.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.60.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.60.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.60.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.61.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.61.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.61.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.61.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.61.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.61.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.62.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.62.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.62.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.62.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.62.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.62.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.63.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.63.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.63.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.63.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.63.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.63.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.64.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.64.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.64.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.64.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.64.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.64.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.65.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.65.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.65.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.65.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.65.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.65.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.66.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.66.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.66.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.66.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.66.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.66.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.67.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.67.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.67.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.67.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.67.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.67.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.68.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.68.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.68.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.68.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.68.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.68.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.69.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.69.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.69.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.69.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.69.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.69.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.7.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.7.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.7.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.7.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.7.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.7.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.70.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.70.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.70.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.70.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.70.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.70.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.71.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.71.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.71.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.71.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.71.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.71.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.72.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.72.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.72.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.72.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.72.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.72.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.73.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.73.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.73.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.73.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.73.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.73.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.74.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.74.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.74.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.74.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.74.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.74.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.75.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.75.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.75.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.75.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.75.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.75.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.76.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.76.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.76.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.76.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.76.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.76.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.77.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.77.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.77.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.77.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.77.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.77.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.78.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.78.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.78.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.78.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.78.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.78.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.79.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.79.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.79.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.79.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.79.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.79.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.8.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.8.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.8.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.8.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.8.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.8.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.80.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.80.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.80.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.80.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.80.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.80.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.81.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.81.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.81.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.81.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.81.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.81.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.82.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.82.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.82.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.82.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.82.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.82.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.83.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.83.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.83.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.83.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.83.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.83.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.84.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.84.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.84.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.84.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.84.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.84.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.85.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.85.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.85.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.85.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.85.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.85.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.86.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.86.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.86.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.86.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.86.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.86.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.87.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.87.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.87.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.87.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.87.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.87.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.88.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.88.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.88.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.88.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.88.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.88.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.89.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.89.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.89.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.89.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.89.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.89.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.9.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.9.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.9.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.9.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.9.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.9.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.90.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.90.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.90.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.90.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.90.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.90.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.91.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.91.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.91.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.91.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.91.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.91.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.92.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.92.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.92.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.92.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.92.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.92.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.93.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.93.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.93.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.93.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.93.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.93.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.94.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.94.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.94.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.94.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.94.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.94.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.95.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.95.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.95.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.95.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.95.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.95.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.96.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.96.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.96.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.96.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.96.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.96.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.97.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.97.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.97.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.97.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.97.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.97.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.98.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.98.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.98.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.98.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.98.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.98.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.99.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.99.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.99.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.99.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.99.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.experts.99.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.gate.e_score_correction_bias": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.gate.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.shared_experts.down_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.shared_experts.down_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.shared_experts.gate_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.shared_experts.gate_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.shared_experts.up_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.mlp.shared_experts.up_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.post_attention_layernorm.weight": "model-00020-of-00047.safetensors", + "model.layers.19.self_attn.k_proj.bias": "model-00020-of-00047.safetensors", + "model.layers.19.self_attn.k_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.self_attn.k_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.self_attn.o_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.self_attn.o_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.self_attn.q_proj.bias": "model-00020-of-00047.safetensors", + "model.layers.19.self_attn.q_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.self_attn.q_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.19.self_attn.v_proj.bias": "model-00020-of-00047.safetensors", + "model.layers.19.self_attn.v_proj.weight": "model-00020-of-00047.safetensors", + "model.layers.19.self_attn.v_proj.weight_scale": "model-00020-of-00047.safetensors", + "model.layers.20.input_layernorm.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.0.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.0.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.0.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.0.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.0.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.0.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.1.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.1.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.1.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.1.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.1.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.1.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.10.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.10.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.10.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.10.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.10.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.10.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.100.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.100.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.100.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.100.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.100.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.100.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.101.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.101.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.101.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.101.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.101.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.101.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.102.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.102.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.102.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.102.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.102.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.102.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.103.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.103.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.103.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.103.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.103.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.103.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.104.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.104.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.104.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.104.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.104.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.104.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.105.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.105.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.105.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.105.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.105.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.105.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.106.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.106.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.106.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.106.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.106.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.106.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.107.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.107.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.107.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.107.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.107.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.107.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.108.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.108.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.108.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.108.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.108.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.108.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.109.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.109.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.109.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.109.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.109.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.109.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.11.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.11.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.11.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.11.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.11.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.11.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.110.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.110.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.110.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.110.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.110.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.110.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.111.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.111.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.111.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.111.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.111.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.111.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.112.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.112.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.112.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.112.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.112.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.112.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.113.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.113.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.113.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.113.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.113.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.113.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.114.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.114.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.114.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.114.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.114.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.114.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.115.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.115.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.115.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.115.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.115.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.115.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.116.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.116.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.116.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.116.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.116.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.116.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.117.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.117.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.117.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.117.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.117.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.117.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.118.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.118.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.118.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.118.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.118.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.118.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.119.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.119.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.119.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.119.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.119.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.119.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.12.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.12.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.12.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.12.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.12.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.12.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.120.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.120.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.120.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.120.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.120.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.120.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.121.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.121.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.121.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.121.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.121.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.121.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.122.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.122.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.122.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.122.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.122.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.122.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.123.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.123.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.123.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.123.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.123.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.123.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.124.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.124.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.124.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.124.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.124.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.124.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.125.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.125.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.125.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.125.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.125.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.125.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.126.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.126.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.126.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.126.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.126.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.126.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.127.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.127.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.127.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.127.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.127.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.127.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.13.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.13.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.13.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.13.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.13.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.13.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.14.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.14.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.14.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.14.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.14.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.14.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.15.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.15.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.15.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.15.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.15.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.15.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.16.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.16.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.16.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.16.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.16.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.16.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.17.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.17.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.17.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.17.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.17.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.17.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.18.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.18.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.18.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.18.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.18.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.18.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.19.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.19.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.19.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.19.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.19.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.19.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.2.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.2.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.2.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.2.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.2.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.2.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.20.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.20.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.20.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.20.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.20.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.20.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.21.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.21.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.21.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.21.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.21.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.21.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.22.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.22.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.22.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.22.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.22.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.22.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.23.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.23.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.23.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.23.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.23.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.23.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.24.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.24.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.24.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.24.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.24.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.24.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.25.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.25.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.25.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.25.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.25.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.25.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.26.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.26.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.26.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.26.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.26.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.26.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.27.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.27.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.27.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.27.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.27.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.27.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.28.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.28.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.28.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.28.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.28.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.28.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.29.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.29.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.29.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.29.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.29.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.29.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.3.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.3.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.3.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.3.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.3.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.3.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.30.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.30.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.30.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.30.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.30.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.30.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.31.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.31.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.31.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.31.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.31.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.31.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.32.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.32.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.32.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.32.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.32.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.32.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.33.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.33.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.33.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.33.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.33.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.33.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.34.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.34.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.34.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.34.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.34.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.34.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.35.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.35.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.35.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.35.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.35.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.35.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.36.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.36.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.36.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.36.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.36.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.36.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.37.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.37.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.37.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.37.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.37.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.37.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.38.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.38.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.38.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.38.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.38.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.38.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.39.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.39.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.39.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.39.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.39.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.39.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.4.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.4.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.4.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.4.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.4.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.4.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.40.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.40.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.40.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.40.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.40.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.40.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.41.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.41.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.41.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.41.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.41.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.41.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.42.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.42.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.42.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.42.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.42.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.42.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.43.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.43.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.43.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.43.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.43.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.43.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.44.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.44.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.44.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.44.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.44.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.44.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.45.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.45.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.45.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.45.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.45.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.45.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.46.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.46.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.46.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.46.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.46.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.46.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.47.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.47.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.47.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.47.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.47.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.47.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.48.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.48.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.48.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.48.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.48.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.48.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.49.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.49.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.49.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.49.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.49.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.49.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.5.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.5.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.5.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.5.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.5.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.5.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.50.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.50.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.50.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.50.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.50.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.50.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.51.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.51.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.51.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.51.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.51.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.51.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.52.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.52.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.52.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.52.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.52.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.52.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.53.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.53.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.53.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.53.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.53.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.53.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.54.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.54.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.54.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.54.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.54.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.54.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.55.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.55.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.55.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.55.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.55.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.55.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.56.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.56.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.56.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.56.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.56.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.56.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.57.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.57.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.57.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.57.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.57.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.57.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.58.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.58.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.58.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.58.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.58.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.58.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.59.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.59.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.59.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.59.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.59.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.59.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.6.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.6.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.6.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.6.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.6.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.6.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.60.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.60.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.60.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.60.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.60.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.60.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.61.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.61.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.61.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.61.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.61.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.61.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.62.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.62.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.62.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.62.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.62.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.62.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.63.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.63.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.63.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.63.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.63.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.63.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.64.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.64.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.64.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.64.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.64.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.64.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.65.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.65.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.65.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.65.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.65.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.65.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.66.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.66.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.66.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.66.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.66.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.66.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.67.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.67.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.67.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.67.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.67.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.67.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.68.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.68.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.68.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.68.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.68.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.68.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.69.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.69.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.69.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.69.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.69.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.69.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.7.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.7.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.7.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.7.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.7.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.7.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.70.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.70.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.70.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.70.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.70.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.70.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.71.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.71.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.71.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.71.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.71.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.71.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.72.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.72.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.72.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.72.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.72.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.72.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.73.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.73.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.73.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.73.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.73.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.73.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.74.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.74.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.74.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.74.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.74.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.74.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.75.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.75.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.75.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.75.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.75.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.75.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.76.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.76.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.76.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.76.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.76.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.76.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.77.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.77.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.77.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.77.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.77.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.77.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.78.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.78.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.78.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.78.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.78.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.78.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.79.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.79.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.79.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.79.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.79.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.79.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.8.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.8.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.8.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.8.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.8.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.8.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.80.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.80.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.80.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.80.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.80.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.80.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.81.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.81.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.81.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.81.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.81.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.81.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.82.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.82.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.82.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.82.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.82.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.82.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.83.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.83.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.83.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.83.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.83.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.83.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.84.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.84.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.84.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.84.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.84.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.84.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.85.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.85.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.85.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.85.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.85.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.85.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.86.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.86.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.86.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.86.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.86.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.86.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.87.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.87.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.87.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.87.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.87.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.87.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.88.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.88.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.88.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.88.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.88.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.88.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.89.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.89.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.89.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.89.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.89.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.89.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.9.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.9.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.9.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.9.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.9.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.9.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.90.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.90.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.90.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.90.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.90.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.90.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.91.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.91.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.91.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.91.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.91.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.91.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.92.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.92.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.92.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.92.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.92.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.92.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.93.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.93.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.93.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.93.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.93.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.93.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.94.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.94.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.94.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.94.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.94.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.94.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.95.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.95.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.95.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.95.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.95.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.95.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.96.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.96.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.96.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.96.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.96.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.96.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.97.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.97.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.97.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.97.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.97.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.97.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.98.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.98.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.98.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.98.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.98.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.98.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.99.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.99.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.99.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.99.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.99.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.experts.99.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.gate.e_score_correction_bias": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.gate.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.shared_experts.down_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.shared_experts.down_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.shared_experts.gate_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.shared_experts.gate_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.shared_experts.up_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.mlp.shared_experts.up_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.post_attention_layernorm.weight": "model-00021-of-00047.safetensors", + "model.layers.20.self_attn.k_proj.bias": "model-00021-of-00047.safetensors", + "model.layers.20.self_attn.k_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.self_attn.k_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.self_attn.o_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.self_attn.o_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.self_attn.q_proj.bias": "model-00021-of-00047.safetensors", + "model.layers.20.self_attn.q_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.self_attn.q_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.20.self_attn.v_proj.bias": "model-00021-of-00047.safetensors", + "model.layers.20.self_attn.v_proj.weight": "model-00021-of-00047.safetensors", + "model.layers.20.self_attn.v_proj.weight_scale": "model-00021-of-00047.safetensors", + "model.layers.21.input_layernorm.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.0.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.0.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.0.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.0.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.0.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.0.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.1.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.1.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.1.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.1.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.1.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.1.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.10.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.10.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.10.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.10.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.10.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.10.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.100.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.100.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.100.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.100.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.100.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.100.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.101.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.101.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.101.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.101.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.101.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.101.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.102.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.102.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.102.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.102.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.102.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.102.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.103.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.103.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.103.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.103.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.103.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.103.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.104.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.104.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.104.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.104.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.104.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.104.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.105.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.105.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.105.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.105.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.105.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.105.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.106.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.106.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.106.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.106.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.106.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.106.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.107.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.107.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.107.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.107.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.107.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.107.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.108.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.108.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.108.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.108.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.108.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.108.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.109.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.109.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.109.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.109.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.109.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.109.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.11.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.11.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.11.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.11.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.11.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.11.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.110.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.110.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.110.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.110.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.110.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.110.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.111.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.111.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.111.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.111.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.111.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.111.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.112.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.112.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.112.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.112.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.112.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.112.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.113.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.113.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.113.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.113.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.113.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.113.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.114.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.114.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.114.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.114.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.114.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.114.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.115.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.115.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.115.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.115.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.115.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.115.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.116.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.116.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.116.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.116.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.116.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.116.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.117.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.117.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.117.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.117.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.117.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.117.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.118.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.118.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.118.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.118.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.118.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.118.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.119.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.119.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.119.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.119.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.119.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.119.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.12.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.12.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.12.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.12.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.12.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.12.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.120.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.120.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.120.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.120.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.120.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.120.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.121.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.121.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.121.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.121.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.121.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.121.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.122.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.122.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.122.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.122.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.122.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.122.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.123.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.123.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.123.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.123.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.123.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.123.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.124.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.124.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.124.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.124.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.124.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.124.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.125.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.125.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.125.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.125.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.125.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.125.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.126.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.126.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.126.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.126.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.126.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.126.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.127.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.127.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.127.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.127.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.127.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.127.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.13.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.13.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.13.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.13.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.13.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.13.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.14.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.14.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.14.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.14.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.14.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.14.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.15.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.15.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.15.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.15.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.15.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.15.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.16.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.16.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.16.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.16.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.16.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.16.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.17.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.17.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.17.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.17.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.17.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.17.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.18.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.18.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.18.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.18.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.18.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.18.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.19.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.19.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.19.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.19.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.19.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.19.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.2.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.2.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.2.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.2.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.2.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.2.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.20.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.20.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.20.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.20.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.20.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.20.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.21.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.21.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.21.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.21.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.21.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.21.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.22.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.22.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.22.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.22.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.22.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.22.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.23.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.23.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.23.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.23.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.23.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.23.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.24.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.24.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.24.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.24.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.24.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.24.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.25.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.25.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.25.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.25.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.25.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.25.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.26.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.26.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.26.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.26.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.26.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.26.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.27.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.27.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.27.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.27.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.27.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.27.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.28.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.28.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.28.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.28.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.28.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.28.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.29.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.29.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.29.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.29.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.29.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.29.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.3.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.3.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.3.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.3.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.3.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.3.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.30.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.30.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.30.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.30.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.30.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.30.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.31.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.31.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.31.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.31.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.31.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.31.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.32.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.32.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.32.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.32.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.32.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.32.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.33.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.33.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.33.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.33.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.33.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.33.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.34.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.34.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.34.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.34.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.34.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.34.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.35.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.35.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.35.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.35.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.35.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.35.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.36.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.36.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.36.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.36.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.36.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.36.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.37.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.37.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.37.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.37.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.37.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.37.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.38.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.38.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.38.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.38.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.38.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.38.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.39.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.39.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.39.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.39.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.39.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.39.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.4.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.4.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.4.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.4.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.4.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.4.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.40.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.40.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.40.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.40.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.40.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.40.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.41.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.41.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.41.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.41.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.41.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.41.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.42.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.42.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.42.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.42.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.42.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.42.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.43.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.43.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.43.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.43.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.43.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.43.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.44.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.44.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.44.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.44.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.44.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.44.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.45.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.45.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.45.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.45.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.45.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.45.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.46.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.46.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.46.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.46.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.46.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.46.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.47.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.47.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.47.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.47.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.47.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.47.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.48.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.48.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.48.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.48.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.48.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.48.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.49.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.49.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.49.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.49.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.49.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.49.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.5.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.5.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.5.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.5.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.5.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.5.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.50.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.50.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.50.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.50.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.50.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.50.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.51.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.51.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.51.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.51.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.51.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.51.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.52.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.52.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.52.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.52.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.52.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.52.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.53.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.53.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.53.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.53.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.53.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.53.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.54.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.54.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.54.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.54.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.54.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.54.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.55.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.55.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.55.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.55.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.55.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.55.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.56.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.56.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.56.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.56.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.56.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.56.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.57.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.57.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.57.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.57.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.57.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.57.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.58.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.58.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.58.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.58.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.58.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.58.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.59.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.59.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.59.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.59.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.59.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.59.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.6.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.6.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.6.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.6.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.6.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.6.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.60.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.60.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.60.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.60.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.60.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.60.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.61.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.61.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.61.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.61.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.61.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.61.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.62.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.62.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.62.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.62.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.62.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.62.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.63.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.63.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.63.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.63.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.63.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.63.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.64.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.64.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.64.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.64.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.64.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.64.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.65.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.65.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.65.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.65.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.65.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.65.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.66.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.66.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.66.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.66.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.66.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.66.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.67.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.67.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.67.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.67.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.67.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.67.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.68.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.68.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.68.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.68.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.68.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.68.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.69.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.69.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.69.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.69.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.69.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.69.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.7.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.7.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.7.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.7.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.7.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.7.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.70.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.70.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.70.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.70.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.70.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.70.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.71.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.71.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.71.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.71.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.71.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.71.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.72.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.72.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.72.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.72.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.72.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.72.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.73.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.73.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.73.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.73.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.73.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.73.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.74.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.74.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.74.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.74.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.74.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.74.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.75.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.75.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.75.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.75.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.75.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.75.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.76.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.76.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.76.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.76.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.76.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.76.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.77.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.77.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.77.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.77.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.77.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.77.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.78.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.78.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.78.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.78.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.78.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.78.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.79.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.79.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.79.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.79.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.79.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.79.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.8.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.8.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.8.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.8.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.8.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.8.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.80.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.80.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.80.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.80.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.80.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.80.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.81.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.81.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.81.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.81.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.81.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.81.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.82.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.82.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.82.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.82.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.82.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.82.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.83.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.83.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.83.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.83.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.83.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.83.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.84.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.84.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.84.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.84.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.84.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.84.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.85.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.85.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.85.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.85.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.85.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.85.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.86.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.86.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.86.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.86.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.86.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.86.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.87.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.87.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.87.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.87.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.87.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.87.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.88.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.88.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.88.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.88.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.88.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.88.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.89.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.89.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.89.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.89.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.89.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.89.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.9.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.9.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.9.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.9.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.9.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.9.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.90.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.90.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.90.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.90.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.90.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.90.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.91.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.91.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.91.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.91.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.91.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.91.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.92.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.92.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.92.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.92.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.92.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.92.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.93.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.93.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.93.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.93.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.93.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.93.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.94.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.94.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.94.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.94.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.94.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.94.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.95.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.95.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.95.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.95.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.95.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.95.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.96.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.96.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.96.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.96.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.96.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.96.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.97.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.97.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.97.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.97.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.97.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.97.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.98.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.98.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.98.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.98.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.98.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.98.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.99.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.99.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.99.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.99.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.99.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.experts.99.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.gate.e_score_correction_bias": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.gate.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.shared_experts.down_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.shared_experts.down_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.shared_experts.gate_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.shared_experts.gate_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.shared_experts.up_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.mlp.shared_experts.up_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.post_attention_layernorm.weight": "model-00022-of-00047.safetensors", + "model.layers.21.self_attn.k_proj.bias": "model-00022-of-00047.safetensors", + "model.layers.21.self_attn.k_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.self_attn.k_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.self_attn.o_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.self_attn.o_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.self_attn.q_proj.bias": "model-00022-of-00047.safetensors", + "model.layers.21.self_attn.q_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.self_attn.q_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.21.self_attn.v_proj.bias": "model-00022-of-00047.safetensors", + "model.layers.21.self_attn.v_proj.weight": "model-00022-of-00047.safetensors", + "model.layers.21.self_attn.v_proj.weight_scale": "model-00022-of-00047.safetensors", + "model.layers.22.input_layernorm.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.0.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.0.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.0.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.0.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.0.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.0.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.1.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.1.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.1.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.1.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.1.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.1.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.10.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.10.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.10.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.10.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.10.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.10.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.100.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.100.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.100.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.100.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.100.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.100.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.101.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.101.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.101.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.101.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.101.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.101.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.102.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.102.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.102.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.102.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.102.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.102.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.103.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.103.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.103.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.103.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.103.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.103.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.104.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.104.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.104.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.104.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.104.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.104.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.105.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.105.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.105.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.105.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.105.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.105.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.106.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.106.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.106.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.106.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.106.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.106.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.107.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.107.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.107.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.107.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.107.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.107.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.108.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.108.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.108.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.108.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.108.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.108.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.109.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.109.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.109.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.109.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.109.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.109.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.11.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.11.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.11.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.11.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.11.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.11.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.110.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.110.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.110.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.110.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.110.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.110.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.111.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.111.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.111.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.111.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.111.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.111.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.112.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.112.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.112.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.112.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.112.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.112.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.113.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.113.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.113.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.113.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.113.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.113.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.114.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.114.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.114.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.114.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.114.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.114.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.115.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.115.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.115.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.115.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.115.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.115.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.116.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.116.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.116.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.116.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.116.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.116.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.117.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.117.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.117.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.117.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.117.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.117.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.118.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.118.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.118.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.118.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.118.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.118.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.119.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.119.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.119.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.119.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.119.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.119.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.12.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.12.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.12.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.12.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.12.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.12.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.120.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.120.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.120.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.120.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.120.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.120.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.121.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.121.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.121.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.121.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.121.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.121.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.122.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.122.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.122.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.122.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.122.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.122.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.123.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.123.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.123.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.123.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.123.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.123.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.124.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.124.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.124.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.124.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.124.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.124.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.125.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.125.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.125.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.125.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.125.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.125.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.126.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.126.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.126.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.126.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.126.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.126.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.127.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.127.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.127.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.127.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.127.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.127.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.13.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.13.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.13.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.13.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.13.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.13.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.14.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.14.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.14.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.14.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.14.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.14.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.15.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.15.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.15.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.15.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.15.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.15.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.16.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.16.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.16.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.16.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.16.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.16.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.17.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.17.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.17.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.17.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.17.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.17.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.18.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.18.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.18.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.18.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.18.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.18.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.19.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.19.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.19.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.19.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.19.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.19.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.2.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.2.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.2.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.2.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.2.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.2.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.20.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.20.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.20.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.20.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.20.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.20.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.21.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.21.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.21.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.21.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.21.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.21.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.22.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.22.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.22.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.22.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.22.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.22.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.23.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.23.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.23.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.23.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.23.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.23.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.24.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.24.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.24.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.24.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.24.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.24.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.25.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.25.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.25.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.25.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.25.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.25.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.26.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.26.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.26.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.26.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.26.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.26.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.27.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.27.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.27.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.27.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.27.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.27.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.28.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.28.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.28.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.28.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.28.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.28.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.29.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.29.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.29.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.29.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.29.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.29.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.3.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.3.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.3.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.3.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.3.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.3.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.30.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.30.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.30.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.30.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.30.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.30.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.31.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.31.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.31.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.31.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.31.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.31.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.32.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.32.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.32.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.32.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.32.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.32.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.33.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.33.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.33.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.33.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.33.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.33.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.34.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.34.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.34.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.34.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.34.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.34.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.35.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.35.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.35.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.35.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.35.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.35.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.36.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.36.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.36.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.36.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.36.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.36.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.37.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.37.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.37.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.37.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.37.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.37.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.38.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.38.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.38.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.38.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.38.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.38.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.39.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.39.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.39.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.39.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.39.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.39.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.4.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.4.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.4.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.4.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.4.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.4.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.40.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.40.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.40.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.40.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.40.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.40.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.41.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.41.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.41.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.41.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.41.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.41.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.42.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.42.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.42.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.42.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.42.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.42.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.43.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.43.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.43.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.43.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.43.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.43.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.44.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.44.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.44.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.44.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.44.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.44.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.45.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.45.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.45.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.45.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.45.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.45.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.46.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.46.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.46.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.46.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.46.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.46.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.47.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.47.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.47.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.47.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.47.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.47.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.48.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.48.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.48.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.48.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.48.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.48.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.49.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.49.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.49.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.49.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.49.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.49.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.5.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.5.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.5.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.5.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.5.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.5.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.50.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.50.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.50.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.50.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.50.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.50.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.51.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.51.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.51.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.51.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.51.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.51.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.52.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.52.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.52.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.52.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.52.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.52.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.53.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.53.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.53.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.53.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.53.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.53.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.54.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.54.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.54.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.54.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.54.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.54.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.55.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.55.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.55.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.55.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.55.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.55.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.56.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.56.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.56.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.56.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.56.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.56.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.57.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.57.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.57.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.57.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.57.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.57.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.58.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.58.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.58.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.58.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.58.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.58.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.59.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.59.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.59.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.59.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.59.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.59.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.6.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.6.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.6.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.6.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.6.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.6.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.60.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.60.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.60.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.60.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.60.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.60.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.61.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.61.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.61.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.61.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.61.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.61.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.62.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.62.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.62.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.62.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.62.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.62.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.63.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.63.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.63.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.63.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.63.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.63.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.64.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.64.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.64.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.64.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.64.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.64.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.65.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.65.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.65.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.65.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.65.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.65.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.66.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.66.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.66.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.66.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.66.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.66.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.67.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.67.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.67.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.67.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.67.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.67.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.68.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.68.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.68.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.68.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.68.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.68.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.69.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.69.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.69.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.69.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.69.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.69.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.7.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.7.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.7.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.7.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.7.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.7.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.70.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.70.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.70.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.70.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.70.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.70.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.71.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.71.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.71.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.71.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.71.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.71.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.72.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.72.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.72.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.72.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.72.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.72.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.73.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.73.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.73.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.73.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.73.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.73.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.74.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.74.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.74.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.74.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.74.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.74.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.75.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.75.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.75.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.75.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.75.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.75.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.76.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.76.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.76.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.76.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.76.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.76.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.77.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.77.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.77.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.77.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.77.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.77.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.78.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.78.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.78.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.78.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.78.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.78.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.79.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.79.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.79.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.79.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.79.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.79.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.8.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.8.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.8.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.8.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.8.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.8.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.80.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.80.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.80.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.80.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.80.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.80.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.81.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.81.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.81.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.81.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.81.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.81.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.82.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.82.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.82.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.82.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.82.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.82.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.83.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.83.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.83.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.83.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.83.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.83.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.84.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.84.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.84.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.84.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.84.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.84.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.85.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.85.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.85.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.85.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.85.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.85.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.86.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.86.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.86.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.86.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.86.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.86.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.87.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.87.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.87.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.87.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.87.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.87.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.88.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.88.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.88.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.88.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.88.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.88.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.89.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.89.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.89.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.89.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.89.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.89.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.9.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.9.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.9.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.9.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.9.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.9.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.90.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.90.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.90.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.90.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.90.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.90.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.91.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.91.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.91.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.91.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.91.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.91.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.92.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.92.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.92.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.92.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.92.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.92.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.93.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.93.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.93.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.93.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.93.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.93.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.94.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.94.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.94.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.94.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.94.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.94.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.95.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.95.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.95.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.95.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.95.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.95.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.96.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.96.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.96.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.96.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.96.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.96.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.97.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.97.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.97.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.97.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.97.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.97.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.98.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.98.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.98.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.98.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.98.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.98.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.99.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.99.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.99.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.99.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.99.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.experts.99.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.gate.e_score_correction_bias": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.gate.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.shared_experts.down_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.shared_experts.down_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.shared_experts.gate_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.shared_experts.gate_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.shared_experts.up_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.mlp.shared_experts.up_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.post_attention_layernorm.weight": "model-00023-of-00047.safetensors", + "model.layers.22.self_attn.k_proj.bias": "model-00023-of-00047.safetensors", + "model.layers.22.self_attn.k_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.self_attn.k_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.self_attn.o_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.self_attn.o_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.self_attn.q_proj.bias": "model-00023-of-00047.safetensors", + "model.layers.22.self_attn.q_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.self_attn.q_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.22.self_attn.v_proj.bias": "model-00023-of-00047.safetensors", + "model.layers.22.self_attn.v_proj.weight": "model-00023-of-00047.safetensors", + "model.layers.22.self_attn.v_proj.weight_scale": "model-00023-of-00047.safetensors", + "model.layers.23.input_layernorm.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.0.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.0.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.0.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.0.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.0.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.0.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.1.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.1.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.1.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.1.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.1.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.1.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.10.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.10.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.10.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.10.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.10.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.10.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.100.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.100.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.100.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.100.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.100.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.100.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.101.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.101.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.101.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.101.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.101.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.101.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.102.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.102.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.102.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.102.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.102.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.102.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.103.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.103.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.103.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.103.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.103.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.103.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.104.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.104.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.104.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.104.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.104.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.104.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.105.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.105.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.105.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.105.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.105.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.105.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.106.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.106.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.106.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.106.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.106.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.106.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.107.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.107.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.107.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.107.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.107.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.107.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.108.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.108.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.108.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.108.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.108.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.108.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.109.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.109.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.109.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.109.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.109.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.109.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.11.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.11.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.11.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.11.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.11.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.11.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.110.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.110.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.110.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.110.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.110.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.110.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.111.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.111.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.111.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.111.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.111.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.111.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.112.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.112.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.112.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.112.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.112.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.112.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.113.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.113.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.113.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.113.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.113.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.113.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.114.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.114.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.114.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.114.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.114.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.114.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.115.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.115.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.115.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.115.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.115.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.115.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.116.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.116.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.116.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.116.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.116.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.116.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.117.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.117.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.117.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.117.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.117.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.117.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.118.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.118.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.118.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.118.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.118.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.118.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.119.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.119.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.119.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.119.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.119.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.119.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.12.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.12.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.12.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.12.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.12.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.12.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.120.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.120.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.120.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.120.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.120.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.120.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.121.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.121.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.121.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.121.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.121.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.121.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.122.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.122.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.122.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.122.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.122.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.122.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.123.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.123.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.123.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.123.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.123.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.123.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.124.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.124.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.124.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.124.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.124.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.124.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.125.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.125.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.125.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.125.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.125.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.125.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.126.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.126.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.126.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.126.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.126.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.126.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.127.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.127.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.127.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.127.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.127.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.127.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.13.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.13.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.13.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.13.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.13.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.13.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.14.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.14.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.14.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.14.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.14.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.14.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.15.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.15.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.15.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.15.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.15.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.15.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.16.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.16.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.16.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.16.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.16.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.16.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.17.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.17.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.17.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.17.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.17.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.17.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.18.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.18.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.18.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.18.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.18.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.18.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.19.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.19.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.19.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.19.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.19.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.19.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.2.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.2.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.2.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.2.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.2.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.2.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.20.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.20.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.20.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.20.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.20.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.20.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.21.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.21.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.21.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.21.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.21.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.21.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.22.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.22.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.22.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.22.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.22.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.22.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.23.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.23.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.23.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.23.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.23.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.23.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.24.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.24.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.24.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.24.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.24.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.24.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.25.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.25.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.25.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.25.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.25.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.25.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.26.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.26.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.26.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.26.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.26.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.26.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.27.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.27.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.27.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.27.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.27.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.27.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.28.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.28.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.28.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.28.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.28.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.28.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.29.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.29.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.29.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.29.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.29.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.29.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.3.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.3.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.3.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.3.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.3.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.3.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.30.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.30.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.30.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.30.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.30.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.30.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.31.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.31.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.31.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.31.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.31.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.31.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.32.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.32.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.32.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.32.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.32.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.32.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.33.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.33.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.33.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.33.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.33.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.33.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.34.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.34.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.34.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.34.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.34.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.34.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.35.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.35.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.35.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.35.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.35.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.35.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.36.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.36.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.36.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.36.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.36.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.36.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.37.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.37.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.37.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.37.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.37.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.37.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.38.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.38.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.38.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.38.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.38.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.38.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.39.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.39.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.39.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.39.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.39.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.39.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.4.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.4.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.4.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.4.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.4.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.4.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.40.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.40.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.40.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.40.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.40.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.40.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.41.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.41.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.41.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.41.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.41.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.41.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.42.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.42.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.42.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.42.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.42.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.42.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.43.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.43.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.43.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.43.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.43.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.43.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.44.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.44.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.44.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.44.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.44.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.44.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.45.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.45.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.45.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.45.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.45.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.45.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.46.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.46.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.46.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.46.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.46.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.46.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.47.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.47.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.47.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.47.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.47.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.47.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.48.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.48.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.48.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.48.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.48.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.48.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.49.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.49.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.49.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.49.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.49.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.49.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.5.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.5.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.5.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.5.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.5.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.5.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.50.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.50.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.50.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.50.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.50.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.50.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.51.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.51.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.51.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.51.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.51.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.51.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.52.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.52.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.52.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.52.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.52.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.52.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.53.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.53.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.53.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.53.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.53.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.53.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.54.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.54.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.54.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.54.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.54.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.54.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.55.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.55.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.55.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.55.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.55.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.55.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.56.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.56.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.56.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.56.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.56.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.56.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.57.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.57.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.57.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.57.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.57.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.57.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.58.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.58.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.58.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.58.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.58.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.58.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.59.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.59.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.59.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.59.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.59.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.59.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.6.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.6.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.6.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.6.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.6.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.6.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.60.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.60.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.60.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.60.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.60.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.60.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.61.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.61.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.61.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.61.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.61.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.61.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.62.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.62.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.62.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.62.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.62.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.62.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.63.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.63.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.63.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.63.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.63.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.63.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.64.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.64.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.64.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.64.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.64.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.64.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.65.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.65.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.65.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.65.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.65.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.65.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.66.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.66.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.66.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.66.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.66.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.66.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.67.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.67.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.67.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.67.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.67.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.67.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.68.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.68.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.68.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.68.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.68.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.68.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.69.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.69.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.69.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.69.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.69.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.69.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.7.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.7.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.7.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.7.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.7.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.7.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.70.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.70.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.70.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.70.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.70.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.70.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.71.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.71.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.71.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.71.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.71.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.71.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.72.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.72.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.72.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.72.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.72.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.72.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.73.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.73.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.73.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.73.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.73.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.73.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.74.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.74.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.74.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.74.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.74.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.74.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.75.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.75.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.75.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.75.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.75.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.75.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.76.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.76.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.76.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.76.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.76.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.76.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.77.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.77.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.77.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.77.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.77.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.77.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.78.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.78.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.78.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.78.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.78.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.78.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.79.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.79.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.79.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.79.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.79.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.79.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.8.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.8.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.8.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.8.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.8.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.8.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.80.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.80.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.80.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.80.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.80.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.80.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.81.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.81.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.81.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.81.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.81.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.81.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.82.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.82.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.82.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.82.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.82.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.82.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.83.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.83.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.83.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.83.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.83.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.83.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.84.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.84.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.84.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.84.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.84.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.84.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.85.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.85.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.85.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.85.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.85.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.85.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.86.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.86.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.86.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.86.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.86.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.86.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.87.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.87.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.87.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.87.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.87.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.87.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.88.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.88.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.88.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.88.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.88.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.88.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.89.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.89.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.89.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.89.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.89.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.89.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.9.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.9.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.9.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.9.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.9.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.9.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.90.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.90.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.90.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.90.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.90.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.90.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.91.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.91.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.91.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.91.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.91.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.91.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.92.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.92.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.92.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.92.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.92.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.92.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.93.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.93.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.93.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.93.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.93.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.93.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.94.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.94.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.94.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.94.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.94.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.94.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.95.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.95.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.95.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.95.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.95.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.95.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.96.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.96.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.96.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.96.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.96.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.96.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.97.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.97.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.97.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.97.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.97.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.97.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.98.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.98.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.98.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.98.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.98.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.98.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.99.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.99.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.99.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.99.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.99.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.experts.99.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.gate.e_score_correction_bias": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.gate.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.shared_experts.down_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.shared_experts.down_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.shared_experts.gate_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.shared_experts.gate_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.shared_experts.up_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.mlp.shared_experts.up_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.post_attention_layernorm.weight": "model-00024-of-00047.safetensors", + "model.layers.23.self_attn.k_proj.bias": "model-00024-of-00047.safetensors", + "model.layers.23.self_attn.k_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.self_attn.k_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.self_attn.o_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.self_attn.o_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.self_attn.q_proj.bias": "model-00024-of-00047.safetensors", + "model.layers.23.self_attn.q_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.self_attn.q_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.23.self_attn.v_proj.bias": "model-00024-of-00047.safetensors", + "model.layers.23.self_attn.v_proj.weight": "model-00024-of-00047.safetensors", + "model.layers.23.self_attn.v_proj.weight_scale": "model-00024-of-00047.safetensors", + "model.layers.24.input_layernorm.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.0.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.0.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.0.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.0.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.0.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.0.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.1.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.1.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.1.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.1.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.1.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.1.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.10.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.10.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.10.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.10.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.10.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.10.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.100.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.100.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.100.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.100.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.100.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.100.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.101.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.101.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.101.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.101.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.101.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.101.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.102.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.102.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.102.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.102.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.102.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.102.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.103.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.103.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.103.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.103.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.103.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.103.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.104.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.104.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.104.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.104.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.104.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.104.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.105.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.105.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.105.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.105.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.105.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.105.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.106.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.106.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.106.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.106.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.106.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.106.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.107.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.107.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.107.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.107.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.107.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.107.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.108.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.108.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.108.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.108.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.108.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.108.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.109.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.109.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.109.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.109.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.109.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.109.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.11.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.11.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.11.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.11.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.11.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.11.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.110.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.110.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.110.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.110.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.110.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.110.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.111.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.111.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.111.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.111.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.111.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.111.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.112.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.112.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.112.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.112.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.112.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.112.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.113.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.113.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.113.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.113.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.113.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.113.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.114.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.114.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.114.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.114.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.114.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.114.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.115.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.115.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.115.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.115.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.115.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.115.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.116.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.116.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.116.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.116.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.116.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.116.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.117.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.117.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.117.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.117.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.117.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.117.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.118.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.118.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.118.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.118.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.118.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.118.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.119.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.119.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.119.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.119.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.119.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.119.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.12.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.12.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.12.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.12.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.12.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.12.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.120.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.120.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.120.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.120.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.120.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.120.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.121.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.121.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.121.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.121.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.121.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.121.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.122.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.122.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.122.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.122.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.122.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.122.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.123.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.123.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.123.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.123.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.123.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.123.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.124.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.124.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.124.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.124.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.124.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.124.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.125.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.125.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.125.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.125.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.125.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.125.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.126.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.126.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.126.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.126.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.126.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.126.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.127.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.127.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.127.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.127.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.127.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.127.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.13.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.13.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.13.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.13.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.13.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.13.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.14.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.14.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.14.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.14.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.14.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.14.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.15.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.15.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.15.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.15.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.15.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.15.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.16.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.16.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.16.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.16.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.16.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.16.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.17.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.17.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.17.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.17.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.17.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.17.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.18.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.18.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.18.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.18.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.18.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.18.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.19.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.19.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.19.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.19.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.19.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.19.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.2.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.2.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.2.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.2.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.2.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.2.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.20.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.20.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.20.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.20.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.20.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.20.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.21.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.21.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.21.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.21.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.21.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.21.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.22.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.22.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.22.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.22.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.22.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.22.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.23.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.23.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.23.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.23.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.23.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.23.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.24.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.24.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.24.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.24.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.24.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.24.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.25.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.25.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.25.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.25.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.25.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.25.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.26.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.26.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.26.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.26.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.26.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.26.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.27.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.27.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.27.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.27.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.27.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.27.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.28.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.28.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.28.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.28.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.28.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.28.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.29.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.29.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.29.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.29.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.29.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.29.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.3.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.3.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.3.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.3.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.3.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.3.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.30.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.30.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.30.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.30.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.30.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.30.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.31.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.31.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.31.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.31.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.31.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.31.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.32.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.32.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.32.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.32.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.32.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.32.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.33.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.33.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.33.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.33.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.33.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.33.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.34.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.34.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.34.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.34.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.34.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.34.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.35.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.35.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.35.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.35.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.35.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.35.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.36.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.36.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.36.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.36.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.36.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.36.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.37.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.37.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.37.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.37.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.37.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.37.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.38.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.38.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.38.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.38.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.38.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.38.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.39.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.39.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.39.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.39.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.39.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.39.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.4.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.4.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.4.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.4.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.4.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.4.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.40.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.40.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.40.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.40.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.40.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.40.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.41.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.41.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.41.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.41.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.41.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.41.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.42.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.42.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.42.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.42.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.42.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.42.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.43.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.43.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.43.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.43.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.43.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.43.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.44.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.44.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.44.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.44.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.44.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.44.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.45.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.45.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.45.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.45.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.45.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.45.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.46.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.46.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.46.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.46.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.46.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.46.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.47.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.47.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.47.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.47.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.47.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.47.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.48.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.48.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.48.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.48.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.48.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.48.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.49.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.49.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.49.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.49.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.49.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.49.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.5.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.5.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.5.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.5.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.5.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.5.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.50.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.50.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.50.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.50.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.50.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.50.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.51.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.51.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.51.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.51.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.51.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.51.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.52.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.52.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.52.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.52.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.52.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.52.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.53.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.53.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.53.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.53.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.53.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.53.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.54.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.54.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.54.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.54.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.54.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.54.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.55.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.55.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.55.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.55.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.55.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.55.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.56.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.56.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.56.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.56.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.56.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.56.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.57.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.57.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.57.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.57.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.57.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.57.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.58.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.58.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.58.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.58.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.58.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.58.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.59.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.59.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.59.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.59.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.59.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.59.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.6.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.6.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.6.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.6.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.6.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.6.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.60.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.60.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.60.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.60.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.60.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.60.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.61.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.61.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.61.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.61.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.61.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.61.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.62.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.62.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.62.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.62.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.62.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.62.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.63.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.63.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.63.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.63.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.63.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.63.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.64.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.64.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.64.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.64.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.64.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.64.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.65.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.65.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.65.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.65.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.65.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.65.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.66.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.66.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.66.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.66.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.66.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.66.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.67.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.67.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.67.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.67.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.67.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.67.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.68.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.68.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.68.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.68.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.68.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.68.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.69.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.69.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.69.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.69.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.69.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.69.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.7.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.7.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.7.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.7.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.7.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.7.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.70.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.70.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.70.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.70.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.70.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.70.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.71.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.71.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.71.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.71.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.71.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.71.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.72.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.72.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.72.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.72.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.72.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.72.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.73.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.73.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.73.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.73.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.73.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.73.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.74.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.74.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.74.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.74.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.74.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.74.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.75.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.75.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.75.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.75.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.75.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.75.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.76.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.76.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.76.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.76.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.76.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.76.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.77.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.77.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.77.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.77.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.77.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.77.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.78.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.78.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.78.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.78.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.78.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.78.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.79.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.79.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.79.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.79.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.79.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.79.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.8.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.8.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.8.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.8.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.8.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.8.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.80.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.80.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.80.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.80.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.80.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.80.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.81.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.81.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.81.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.81.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.81.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.81.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.82.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.82.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.82.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.82.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.82.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.82.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.83.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.83.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.83.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.83.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.83.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.83.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.84.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.84.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.84.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.84.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.84.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.84.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.85.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.85.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.85.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.85.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.85.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.85.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.86.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.86.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.86.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.86.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.86.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.86.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.87.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.87.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.87.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.87.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.87.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.87.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.88.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.88.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.88.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.88.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.88.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.88.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.89.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.89.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.89.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.89.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.89.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.89.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.9.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.9.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.9.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.9.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.9.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.9.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.90.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.90.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.90.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.90.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.90.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.90.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.91.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.91.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.91.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.91.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.91.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.91.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.92.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.92.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.92.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.92.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.92.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.92.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.93.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.93.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.93.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.93.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.93.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.93.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.94.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.94.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.94.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.94.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.94.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.94.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.95.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.95.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.95.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.95.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.95.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.95.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.96.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.96.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.96.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.96.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.96.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.96.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.97.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.97.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.97.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.97.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.97.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.97.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.98.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.98.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.98.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.98.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.98.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.98.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.99.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.99.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.99.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.99.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.99.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.experts.99.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.gate.e_score_correction_bias": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.gate.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.shared_experts.down_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.shared_experts.down_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.shared_experts.gate_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.shared_experts.gate_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.shared_experts.up_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.mlp.shared_experts.up_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.post_attention_layernorm.weight": "model-00025-of-00047.safetensors", + "model.layers.24.self_attn.k_proj.bias": "model-00025-of-00047.safetensors", + "model.layers.24.self_attn.k_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.self_attn.k_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.self_attn.o_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.self_attn.o_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.self_attn.q_proj.bias": "model-00025-of-00047.safetensors", + "model.layers.24.self_attn.q_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.self_attn.q_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.24.self_attn.v_proj.bias": "model-00025-of-00047.safetensors", + "model.layers.24.self_attn.v_proj.weight": "model-00025-of-00047.safetensors", + "model.layers.24.self_attn.v_proj.weight_scale": "model-00025-of-00047.safetensors", + "model.layers.25.input_layernorm.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.0.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.0.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.0.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.0.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.0.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.0.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.1.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.1.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.1.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.1.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.1.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.1.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.10.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.10.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.10.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.10.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.10.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.10.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.100.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.100.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.100.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.100.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.100.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.100.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.101.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.101.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.101.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.101.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.101.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.101.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.102.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.102.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.102.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.102.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.102.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.102.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.103.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.103.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.103.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.103.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.103.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.103.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.104.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.104.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.104.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.104.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.104.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.104.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.105.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.105.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.105.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.105.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.105.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.105.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.106.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.106.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.106.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.106.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.106.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.106.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.107.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.107.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.107.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.107.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.107.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.107.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.108.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.108.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.108.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.108.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.108.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.108.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.109.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.109.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.109.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.109.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.109.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.109.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.11.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.11.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.11.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.11.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.11.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.11.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.110.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.110.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.110.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.110.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.110.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.110.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.111.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.111.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.111.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.111.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.111.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.111.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.112.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.112.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.112.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.112.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.112.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.112.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.113.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.113.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.113.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.113.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.113.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.113.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.114.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.114.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.114.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.114.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.114.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.114.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.115.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.115.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.115.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.115.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.115.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.115.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.116.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.116.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.116.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.116.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.116.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.116.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.117.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.117.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.117.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.117.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.117.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.117.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.118.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.118.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.118.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.118.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.118.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.118.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.119.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.119.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.119.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.119.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.119.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.119.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.12.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.12.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.12.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.12.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.12.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.12.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.120.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.120.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.120.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.120.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.120.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.120.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.121.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.121.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.121.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.121.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.121.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.121.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.122.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.122.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.122.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.122.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.122.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.122.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.123.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.123.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.123.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.123.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.123.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.123.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.124.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.124.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.124.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.124.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.124.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.124.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.125.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.125.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.125.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.125.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.125.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.125.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.126.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.126.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.126.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.126.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.126.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.126.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.127.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.127.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.127.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.127.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.127.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.127.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.13.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.13.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.13.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.13.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.13.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.13.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.14.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.14.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.14.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.14.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.14.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.14.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.15.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.15.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.15.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.15.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.15.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.15.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.16.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.16.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.16.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.16.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.16.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.16.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.17.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.17.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.17.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.17.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.17.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.17.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.18.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.18.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.18.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.18.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.18.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.18.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.19.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.19.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.19.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.19.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.19.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.19.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.2.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.2.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.2.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.2.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.2.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.2.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.20.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.20.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.20.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.20.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.20.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.20.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.21.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.21.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.21.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.21.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.21.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.21.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.22.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.22.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.22.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.22.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.22.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.22.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.23.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.23.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.23.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.23.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.23.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.23.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.24.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.24.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.24.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.24.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.24.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.24.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.25.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.25.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.25.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.25.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.25.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.25.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.26.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.26.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.26.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.26.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.26.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.26.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.27.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.27.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.27.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.27.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.27.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.27.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.28.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.28.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.28.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.28.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.28.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.28.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.29.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.29.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.29.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.29.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.29.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.29.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.3.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.3.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.3.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.3.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.3.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.3.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.30.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.30.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.30.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.30.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.30.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.30.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.31.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.31.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.31.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.31.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.31.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.31.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.32.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.32.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.32.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.32.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.32.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.32.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.33.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.33.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.33.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.33.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.33.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.33.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.34.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.34.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.34.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.34.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.34.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.34.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.35.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.35.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.35.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.35.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.35.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.35.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.36.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.36.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.36.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.36.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.36.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.36.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.37.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.37.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.37.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.37.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.37.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.37.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.38.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.38.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.38.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.38.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.38.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.38.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.39.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.39.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.39.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.39.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.39.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.39.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.4.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.4.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.4.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.4.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.4.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.4.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.40.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.40.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.40.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.40.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.40.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.40.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.41.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.41.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.41.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.41.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.41.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.41.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.42.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.42.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.42.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.42.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.42.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.42.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.43.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.43.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.43.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.43.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.43.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.43.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.44.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.44.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.44.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.44.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.44.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.44.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.45.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.45.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.45.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.45.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.45.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.45.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.46.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.46.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.46.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.46.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.46.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.46.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.47.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.47.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.47.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.47.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.47.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.47.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.48.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.48.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.48.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.48.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.48.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.48.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.49.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.49.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.49.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.49.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.49.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.49.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.5.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.5.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.5.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.5.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.5.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.5.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.50.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.50.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.50.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.50.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.50.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.50.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.51.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.51.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.51.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.51.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.51.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.51.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.52.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.52.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.52.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.52.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.52.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.52.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.53.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.53.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.53.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.53.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.53.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.53.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.54.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.54.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.54.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.54.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.54.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.54.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.55.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.55.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.55.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.55.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.55.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.55.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.56.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.56.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.56.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.56.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.56.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.56.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.57.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.57.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.57.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.57.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.57.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.57.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.58.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.58.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.58.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.58.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.58.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.58.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.59.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.59.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.59.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.59.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.59.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.59.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.6.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.6.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.6.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.6.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.6.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.6.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.60.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.60.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.60.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.60.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.60.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.60.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.61.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.61.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.61.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.61.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.61.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.61.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.62.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.62.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.62.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.62.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.62.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.62.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.63.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.63.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.63.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.63.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.63.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.63.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.64.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.64.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.64.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.64.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.64.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.64.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.65.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.65.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.65.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.65.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.65.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.65.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.66.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.66.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.66.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.66.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.66.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.66.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.67.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.67.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.67.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.67.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.67.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.67.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.68.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.68.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.68.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.68.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.68.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.68.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.69.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.69.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.69.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.69.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.69.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.69.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.7.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.7.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.7.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.7.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.7.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.7.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.70.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.70.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.70.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.70.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.70.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.70.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.71.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.71.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.71.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.71.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.71.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.71.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.72.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.72.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.72.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.72.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.72.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.72.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.73.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.73.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.73.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.73.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.73.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.73.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.74.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.74.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.74.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.74.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.74.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.74.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.75.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.75.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.75.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.75.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.75.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.75.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.76.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.76.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.76.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.76.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.76.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.76.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.77.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.77.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.77.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.77.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.77.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.77.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.78.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.78.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.78.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.78.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.78.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.78.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.79.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.79.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.79.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.79.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.79.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.79.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.8.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.8.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.8.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.8.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.8.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.8.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.80.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.80.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.80.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.80.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.80.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.80.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.81.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.81.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.81.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.81.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.81.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.81.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.82.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.82.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.82.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.82.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.82.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.82.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.83.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.83.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.83.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.83.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.83.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.83.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.84.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.84.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.84.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.84.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.84.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.84.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.85.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.85.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.85.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.85.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.85.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.85.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.86.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.86.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.86.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.86.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.86.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.86.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.87.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.87.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.87.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.87.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.87.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.87.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.88.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.88.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.88.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.88.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.88.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.88.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.89.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.89.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.89.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.89.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.89.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.89.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.9.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.9.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.9.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.9.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.9.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.9.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.90.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.90.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.90.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.90.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.90.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.90.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.91.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.91.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.91.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.91.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.91.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.91.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.92.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.92.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.92.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.92.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.92.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.92.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.93.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.93.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.93.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.93.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.93.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.93.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.94.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.94.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.94.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.94.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.94.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.94.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.95.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.95.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.95.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.95.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.95.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.95.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.96.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.96.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.96.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.96.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.96.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.96.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.97.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.97.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.97.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.97.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.97.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.97.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.98.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.98.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.98.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.98.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.98.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.98.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.99.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.99.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.99.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.99.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.99.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.experts.99.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.gate.e_score_correction_bias": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.gate.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.shared_experts.down_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.shared_experts.down_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.shared_experts.gate_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.shared_experts.gate_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.shared_experts.up_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.mlp.shared_experts.up_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.post_attention_layernorm.weight": "model-00026-of-00047.safetensors", + "model.layers.25.self_attn.k_proj.bias": "model-00026-of-00047.safetensors", + "model.layers.25.self_attn.k_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.self_attn.k_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.self_attn.o_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.self_attn.o_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.self_attn.q_proj.bias": "model-00026-of-00047.safetensors", + "model.layers.25.self_attn.q_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.self_attn.q_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.25.self_attn.v_proj.bias": "model-00026-of-00047.safetensors", + "model.layers.25.self_attn.v_proj.weight": "model-00026-of-00047.safetensors", + "model.layers.25.self_attn.v_proj.weight_scale": "model-00026-of-00047.safetensors", + "model.layers.26.input_layernorm.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.0.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.0.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.0.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.0.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.0.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.0.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.1.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.1.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.1.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.1.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.1.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.1.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.10.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.10.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.10.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.10.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.10.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.10.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.100.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.100.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.100.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.100.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.100.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.100.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.101.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.101.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.101.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.101.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.101.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.101.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.102.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.102.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.102.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.102.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.102.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.102.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.103.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.103.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.103.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.103.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.103.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.103.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.104.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.104.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.104.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.104.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.104.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.104.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.105.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.105.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.105.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.105.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.105.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.105.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.106.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.106.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.106.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.106.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.106.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.106.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.107.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.107.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.107.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.107.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.107.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.107.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.108.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.108.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.108.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.108.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.108.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.108.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.109.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.109.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.109.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.109.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.109.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.109.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.11.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.11.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.11.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.11.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.11.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.11.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.110.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.110.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.110.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.110.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.110.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.110.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.111.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.111.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.111.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.111.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.111.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.111.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.112.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.112.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.112.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.112.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.112.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.112.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.113.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.113.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.113.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.113.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.113.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.113.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.114.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.114.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.114.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.114.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.114.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.114.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.115.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.115.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.115.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.115.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.115.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.115.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.116.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.116.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.116.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.116.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.116.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.116.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.117.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.117.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.117.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.117.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.117.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.117.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.118.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.118.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.118.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.118.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.118.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.118.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.119.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.119.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.119.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.119.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.119.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.119.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.12.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.12.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.12.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.12.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.12.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.12.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.120.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.120.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.120.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.120.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.120.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.120.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.121.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.121.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.121.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.121.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.121.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.121.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.122.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.122.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.122.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.122.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.122.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.122.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.123.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.123.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.123.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.123.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.123.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.123.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.124.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.124.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.124.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.124.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.124.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.124.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.125.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.125.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.125.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.125.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.125.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.125.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.126.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.126.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.126.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.126.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.126.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.126.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.127.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.127.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.127.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.127.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.127.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.127.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.13.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.13.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.13.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.13.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.13.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.13.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.14.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.14.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.14.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.14.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.14.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.14.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.15.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.15.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.15.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.15.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.15.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.15.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.16.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.16.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.16.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.16.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.16.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.16.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.17.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.17.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.17.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.17.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.17.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.17.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.18.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.18.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.18.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.18.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.18.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.18.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.19.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.19.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.19.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.19.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.19.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.19.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.2.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.2.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.2.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.2.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.2.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.2.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.20.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.20.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.20.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.20.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.20.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.20.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.21.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.21.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.21.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.21.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.21.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.21.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.22.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.22.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.22.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.22.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.22.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.22.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.23.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.23.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.23.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.23.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.23.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.23.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.24.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.24.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.24.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.24.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.24.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.24.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.25.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.25.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.25.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.25.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.25.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.25.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.26.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.26.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.26.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.26.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.26.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.26.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.27.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.27.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.27.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.27.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.27.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.27.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.28.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.28.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.28.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.28.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.28.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.28.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.29.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.29.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.29.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.29.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.29.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.29.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.3.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.3.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.3.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.3.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.3.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.3.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.30.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.30.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.30.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.30.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.30.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.30.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.31.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.31.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.31.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.31.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.31.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.31.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.32.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.32.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.32.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.32.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.32.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.32.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.33.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.33.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.33.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.33.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.33.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.33.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.34.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.34.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.34.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.34.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.34.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.34.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.35.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.35.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.35.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.35.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.35.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.35.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.36.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.36.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.36.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.36.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.36.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.36.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.37.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.37.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.37.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.37.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.37.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.37.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.38.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.38.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.38.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.38.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.38.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.38.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.39.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.39.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.39.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.39.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.39.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.39.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.4.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.4.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.4.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.4.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.4.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.4.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.40.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.40.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.40.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.40.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.40.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.40.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.41.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.41.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.41.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.41.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.41.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.41.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.42.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.42.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.42.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.42.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.42.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.42.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.43.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.43.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.43.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.43.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.43.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.43.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.44.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.44.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.44.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.44.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.44.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.44.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.45.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.45.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.45.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.45.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.45.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.45.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.46.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.46.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.46.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.46.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.46.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.46.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.47.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.47.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.47.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.47.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.47.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.47.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.48.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.48.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.48.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.48.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.48.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.48.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.49.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.49.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.49.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.49.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.49.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.49.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.5.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.5.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.5.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.5.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.5.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.5.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.50.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.50.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.50.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.50.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.50.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.50.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.51.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.51.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.51.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.51.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.51.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.51.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.52.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.52.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.52.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.52.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.52.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.52.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.53.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.53.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.53.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.53.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.53.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.53.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.54.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.54.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.54.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.54.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.54.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.54.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.55.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.55.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.55.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.55.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.55.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.55.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.56.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.56.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.56.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.56.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.56.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.56.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.57.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.57.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.57.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.57.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.57.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.57.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.58.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.58.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.58.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.58.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.58.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.58.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.59.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.59.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.59.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.59.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.59.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.59.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.6.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.6.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.6.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.6.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.6.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.6.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.60.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.60.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.60.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.60.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.60.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.60.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.61.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.61.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.61.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.61.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.61.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.61.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.62.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.62.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.62.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.62.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.62.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.62.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.63.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.63.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.63.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.63.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.63.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.63.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.64.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.64.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.64.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.64.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.64.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.64.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.65.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.65.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.65.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.65.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.65.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.65.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.66.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.66.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.66.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.66.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.66.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.66.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.67.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.67.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.67.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.67.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.67.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.67.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.68.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.68.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.68.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.68.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.68.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.68.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.69.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.69.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.69.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.69.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.69.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.69.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.7.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.7.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.7.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.7.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.7.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.7.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.70.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.70.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.70.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.70.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.70.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.70.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.71.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.71.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.71.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.71.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.71.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.71.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.72.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.72.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.72.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.72.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.72.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.72.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.73.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.73.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.73.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.73.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.73.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.73.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.74.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.74.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.74.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.74.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.74.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.74.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.75.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.75.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.75.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.75.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.75.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.75.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.76.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.76.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.76.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.76.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.76.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.76.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.77.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.77.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.77.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.77.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.77.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.77.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.78.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.78.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.78.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.78.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.78.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.78.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.79.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.79.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.79.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.79.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.79.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.79.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.8.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.8.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.8.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.8.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.8.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.8.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.80.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.80.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.80.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.80.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.80.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.80.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.81.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.81.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.81.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.81.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.81.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.81.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.82.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.82.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.82.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.82.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.82.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.82.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.83.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.83.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.83.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.83.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.83.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.83.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.84.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.84.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.84.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.84.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.84.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.84.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.85.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.85.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.85.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.85.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.85.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.85.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.86.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.86.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.86.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.86.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.86.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.86.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.87.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.87.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.87.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.87.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.87.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.87.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.88.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.88.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.88.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.88.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.88.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.88.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.89.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.89.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.89.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.89.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.89.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.89.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.9.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.9.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.9.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.9.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.9.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.9.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.90.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.90.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.90.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.90.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.90.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.90.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.91.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.91.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.91.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.91.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.91.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.91.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.92.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.92.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.92.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.92.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.92.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.92.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.93.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.93.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.93.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.93.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.93.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.93.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.94.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.94.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.94.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.94.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.94.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.94.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.95.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.95.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.95.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.95.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.95.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.95.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.96.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.96.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.96.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.96.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.96.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.96.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.97.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.97.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.97.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.97.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.97.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.97.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.98.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.98.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.98.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.98.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.98.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.98.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.99.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.99.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.99.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.99.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.99.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.experts.99.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.gate.e_score_correction_bias": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.gate.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.shared_experts.down_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.shared_experts.down_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.shared_experts.gate_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.shared_experts.gate_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.shared_experts.up_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.mlp.shared_experts.up_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.post_attention_layernorm.weight": "model-00027-of-00047.safetensors", + "model.layers.26.self_attn.k_proj.bias": "model-00027-of-00047.safetensors", + "model.layers.26.self_attn.k_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.self_attn.k_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.self_attn.o_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.self_attn.o_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.self_attn.q_proj.bias": "model-00027-of-00047.safetensors", + "model.layers.26.self_attn.q_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.self_attn.q_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.26.self_attn.v_proj.bias": "model-00027-of-00047.safetensors", + "model.layers.26.self_attn.v_proj.weight": "model-00027-of-00047.safetensors", + "model.layers.26.self_attn.v_proj.weight_scale": "model-00027-of-00047.safetensors", + "model.layers.27.input_layernorm.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.0.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.0.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.0.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.0.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.0.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.0.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.1.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.1.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.1.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.1.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.1.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.1.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.10.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.10.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.10.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.10.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.10.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.10.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.100.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.100.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.100.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.100.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.100.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.100.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.101.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.101.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.101.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.101.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.101.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.101.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.102.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.102.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.102.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.102.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.102.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.102.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.103.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.103.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.103.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.103.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.103.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.103.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.104.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.104.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.104.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.104.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.104.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.104.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.105.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.105.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.105.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.105.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.105.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.105.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.106.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.106.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.106.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.106.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.106.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.106.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.107.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.107.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.107.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.107.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.107.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.107.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.108.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.108.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.108.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.108.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.108.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.108.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.109.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.109.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.109.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.109.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.109.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.109.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.11.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.11.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.11.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.11.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.11.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.11.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.110.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.110.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.110.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.110.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.110.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.110.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.111.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.111.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.111.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.111.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.111.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.111.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.112.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.112.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.112.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.112.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.112.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.112.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.113.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.113.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.113.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.113.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.113.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.113.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.114.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.114.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.114.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.114.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.114.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.114.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.115.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.115.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.115.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.115.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.115.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.115.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.116.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.116.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.116.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.116.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.116.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.116.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.117.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.117.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.117.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.117.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.117.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.117.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.118.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.118.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.118.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.118.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.118.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.118.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.119.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.119.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.119.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.119.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.119.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.119.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.12.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.12.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.12.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.12.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.12.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.12.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.120.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.120.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.120.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.120.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.120.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.120.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.121.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.121.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.121.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.121.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.121.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.121.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.122.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.122.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.122.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.122.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.122.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.122.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.123.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.123.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.123.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.123.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.123.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.123.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.124.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.124.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.124.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.124.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.124.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.124.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.125.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.125.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.125.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.125.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.125.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.125.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.126.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.126.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.126.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.126.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.126.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.126.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.127.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.127.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.127.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.127.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.127.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.127.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.13.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.13.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.13.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.13.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.13.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.13.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.14.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.14.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.14.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.14.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.14.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.14.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.15.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.15.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.15.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.15.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.15.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.15.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.16.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.16.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.16.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.16.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.16.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.16.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.17.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.17.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.17.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.17.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.17.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.17.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.18.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.18.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.18.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.18.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.18.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.18.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.19.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.19.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.19.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.19.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.19.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.19.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.2.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.2.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.2.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.2.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.2.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.2.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.20.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.20.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.20.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.20.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.20.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.20.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.21.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.21.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.21.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.21.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.21.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.21.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.22.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.22.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.22.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.22.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.22.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.22.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.23.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.23.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.23.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.23.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.23.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.23.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.24.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.24.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.24.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.24.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.24.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.24.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.25.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.25.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.25.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.25.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.25.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.25.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.26.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.26.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.26.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.26.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.26.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.26.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.27.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.27.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.27.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.27.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.27.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.27.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.28.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.28.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.28.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.28.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.28.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.28.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.29.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.29.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.29.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.29.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.29.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.29.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.3.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.3.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.3.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.3.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.3.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.3.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.30.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.30.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.30.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.30.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.30.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.30.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.31.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.31.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.31.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.31.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.31.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.31.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.32.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.32.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.32.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.32.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.32.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.32.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.33.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.33.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.33.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.33.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.33.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.33.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.34.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.34.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.34.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.34.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.34.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.34.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.35.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.35.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.35.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.35.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.35.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.35.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.36.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.36.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.36.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.36.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.36.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.36.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.37.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.37.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.37.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.37.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.37.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.37.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.38.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.38.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.38.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.38.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.38.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.38.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.39.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.39.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.39.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.39.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.39.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.39.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.4.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.4.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.4.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.4.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.4.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.4.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.40.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.40.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.40.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.40.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.40.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.40.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.41.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.41.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.41.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.41.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.41.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.41.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.42.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.42.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.42.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.42.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.42.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.42.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.43.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.43.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.43.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.43.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.43.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.43.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.44.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.44.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.44.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.44.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.44.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.44.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.45.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.45.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.45.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.45.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.45.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.45.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.46.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.46.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.46.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.46.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.46.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.46.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.47.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.47.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.47.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.47.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.47.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.47.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.48.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.48.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.48.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.48.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.48.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.48.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.49.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.49.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.49.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.49.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.49.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.49.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.5.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.5.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.5.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.5.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.5.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.5.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.50.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.50.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.50.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.50.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.50.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.50.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.51.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.51.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.51.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.51.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.51.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.51.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.52.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.52.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.52.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.52.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.52.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.52.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.53.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.53.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.53.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.53.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.53.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.53.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.54.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.54.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.54.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.54.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.54.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.54.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.55.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.55.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.55.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.55.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.55.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.55.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.56.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.56.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.56.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.56.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.56.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.56.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.57.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.57.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.57.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.57.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.57.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.57.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.58.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.58.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.58.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.58.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.58.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.58.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.59.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.59.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.59.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.59.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.59.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.59.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.6.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.6.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.6.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.6.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.6.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.6.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.60.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.60.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.60.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.60.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.60.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.60.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.61.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.61.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.61.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.61.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.61.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.61.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.62.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.62.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.62.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.62.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.62.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.62.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.63.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.63.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.63.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.63.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.63.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.63.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.64.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.64.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.64.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.64.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.64.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.64.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.65.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.65.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.65.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.65.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.65.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.65.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.66.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.66.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.66.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.66.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.66.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.66.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.67.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.67.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.67.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.67.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.67.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.67.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.68.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.68.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.68.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.68.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.68.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.68.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.69.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.69.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.69.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.69.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.69.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.69.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.7.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.7.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.7.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.7.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.7.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.7.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.70.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.70.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.70.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.70.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.70.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.70.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.71.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.71.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.71.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.71.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.71.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.71.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.72.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.72.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.72.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.72.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.72.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.72.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.73.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.73.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.73.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.73.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.73.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.73.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.74.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.74.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.74.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.74.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.74.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.74.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.75.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.75.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.75.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.75.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.75.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.75.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.76.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.76.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.76.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.76.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.76.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.76.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.77.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.77.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.77.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.77.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.77.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.77.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.78.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.78.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.78.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.78.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.78.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.78.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.79.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.79.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.79.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.79.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.79.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.79.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.8.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.8.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.8.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.8.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.8.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.8.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.80.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.80.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.80.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.80.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.80.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.80.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.81.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.81.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.81.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.81.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.81.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.81.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.82.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.82.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.82.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.82.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.82.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.82.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.83.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.83.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.83.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.83.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.83.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.83.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.84.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.84.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.84.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.84.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.84.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.84.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.85.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.85.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.85.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.85.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.85.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.85.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.86.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.86.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.86.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.86.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.86.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.86.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.87.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.87.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.87.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.87.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.87.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.87.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.88.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.88.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.88.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.88.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.88.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.88.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.89.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.89.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.89.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.89.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.89.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.89.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.9.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.9.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.9.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.9.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.9.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.9.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.90.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.90.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.90.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.90.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.90.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.90.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.91.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.91.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.91.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.91.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.91.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.91.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.92.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.92.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.92.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.92.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.92.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.92.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.93.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.93.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.93.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.93.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.93.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.93.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.94.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.94.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.94.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.94.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.94.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.94.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.95.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.95.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.95.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.95.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.95.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.95.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.96.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.96.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.96.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.96.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.96.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.96.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.97.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.97.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.97.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.97.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.97.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.97.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.98.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.98.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.98.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.98.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.98.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.98.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.99.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.99.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.99.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.99.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.99.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.experts.99.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.gate.e_score_correction_bias": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.gate.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.shared_experts.down_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.shared_experts.down_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.shared_experts.gate_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.shared_experts.gate_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.shared_experts.up_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.mlp.shared_experts.up_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.post_attention_layernorm.weight": "model-00028-of-00047.safetensors", + "model.layers.27.self_attn.k_proj.bias": "model-00028-of-00047.safetensors", + "model.layers.27.self_attn.k_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.self_attn.k_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.self_attn.o_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.self_attn.o_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.self_attn.q_proj.bias": "model-00028-of-00047.safetensors", + "model.layers.27.self_attn.q_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.self_attn.q_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.27.self_attn.v_proj.bias": "model-00028-of-00047.safetensors", + "model.layers.27.self_attn.v_proj.weight": "model-00028-of-00047.safetensors", + "model.layers.27.self_attn.v_proj.weight_scale": "model-00028-of-00047.safetensors", + "model.layers.28.input_layernorm.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.0.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.0.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.0.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.0.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.0.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.0.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.1.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.1.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.1.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.1.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.1.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.1.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.10.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.10.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.10.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.10.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.10.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.10.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.100.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.100.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.100.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.100.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.100.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.100.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.101.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.101.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.101.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.101.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.101.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.101.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.102.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.102.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.102.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.102.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.102.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.102.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.103.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.103.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.103.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.103.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.103.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.103.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.104.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.104.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.104.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.104.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.104.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.104.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.105.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.105.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.105.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.105.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.105.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.105.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.106.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.106.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.106.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.106.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.106.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.106.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.107.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.107.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.107.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.107.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.107.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.107.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.108.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.108.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.108.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.108.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.108.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.108.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.109.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.109.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.109.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.109.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.109.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.109.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.11.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.11.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.11.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.11.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.11.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.11.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.110.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.110.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.110.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.110.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.110.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.110.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.111.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.111.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.111.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.111.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.111.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.111.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.112.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.112.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.112.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.112.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.112.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.112.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.113.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.113.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.113.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.113.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.113.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.113.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.114.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.114.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.114.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.114.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.114.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.114.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.115.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.115.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.115.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.115.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.115.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.115.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.116.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.116.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.116.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.116.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.116.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.116.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.117.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.117.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.117.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.117.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.117.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.117.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.118.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.118.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.118.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.118.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.118.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.118.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.119.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.119.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.119.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.119.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.119.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.119.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.12.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.12.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.12.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.12.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.12.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.12.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.120.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.120.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.120.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.120.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.120.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.120.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.121.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.121.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.121.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.121.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.121.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.121.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.122.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.122.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.122.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.122.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.122.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.122.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.123.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.123.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.123.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.123.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.123.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.123.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.124.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.124.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.124.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.124.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.124.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.124.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.125.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.125.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.125.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.125.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.125.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.125.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.126.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.126.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.126.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.126.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.126.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.126.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.127.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.127.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.127.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.127.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.127.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.127.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.13.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.13.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.13.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.13.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.13.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.13.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.14.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.14.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.14.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.14.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.14.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.14.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.15.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.15.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.15.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.15.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.15.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.15.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.16.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.16.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.16.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.16.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.16.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.16.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.17.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.17.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.17.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.17.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.17.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.17.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.18.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.18.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.18.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.18.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.18.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.18.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.19.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.19.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.19.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.19.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.19.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.19.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.2.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.2.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.2.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.2.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.2.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.2.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.20.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.20.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.20.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.20.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.20.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.20.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.21.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.21.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.21.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.21.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.21.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.21.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.22.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.22.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.22.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.22.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.22.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.22.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.23.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.23.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.23.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.23.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.23.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.23.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.24.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.24.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.24.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.24.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.24.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.24.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.25.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.25.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.25.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.25.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.25.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.25.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.26.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.26.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.26.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.26.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.26.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.26.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.27.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.27.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.27.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.27.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.27.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.27.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.28.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.28.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.28.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.28.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.28.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.28.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.29.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.29.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.29.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.29.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.29.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.29.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.3.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.3.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.3.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.3.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.3.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.3.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.30.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.30.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.30.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.30.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.30.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.30.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.31.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.31.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.31.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.31.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.31.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.31.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.32.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.32.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.32.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.32.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.32.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.32.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.33.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.33.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.33.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.33.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.33.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.33.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.34.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.34.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.34.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.34.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.34.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.34.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.35.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.35.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.35.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.35.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.35.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.35.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.36.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.36.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.36.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.36.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.36.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.36.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.37.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.37.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.37.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.37.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.37.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.37.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.38.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.38.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.38.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.38.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.38.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.38.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.39.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.39.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.39.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.39.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.39.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.39.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.4.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.4.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.4.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.4.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.4.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.4.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.40.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.40.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.40.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.40.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.40.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.40.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.41.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.41.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.41.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.41.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.41.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.41.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.42.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.42.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.42.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.42.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.42.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.42.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.43.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.43.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.43.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.43.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.43.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.43.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.44.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.44.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.44.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.44.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.44.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.44.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.45.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.45.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.45.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.45.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.45.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.45.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.46.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.46.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.46.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.46.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.46.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.46.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.47.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.47.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.47.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.47.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.47.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.47.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.48.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.48.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.48.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.48.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.48.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.48.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.49.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.49.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.49.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.49.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.49.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.49.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.5.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.5.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.5.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.5.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.5.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.5.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.50.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.50.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.50.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.50.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.50.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.50.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.51.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.51.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.51.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.51.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.51.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.51.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.52.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.52.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.52.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.52.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.52.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.52.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.53.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.53.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.53.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.53.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.53.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.53.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.54.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.54.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.54.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.54.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.54.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.54.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.55.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.55.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.55.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.55.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.55.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.55.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.56.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.56.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.56.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.56.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.56.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.56.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.57.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.57.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.57.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.57.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.57.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.57.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.58.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.58.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.58.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.58.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.58.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.58.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.59.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.59.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.59.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.59.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.59.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.59.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.6.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.6.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.6.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.6.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.6.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.6.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.60.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.60.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.60.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.60.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.60.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.60.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.61.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.61.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.61.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.61.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.61.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.61.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.62.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.62.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.62.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.62.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.62.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.62.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.63.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.63.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.63.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.63.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.63.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.63.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.64.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.64.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.64.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.64.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.64.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.64.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.65.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.65.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.65.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.65.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.65.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.65.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.66.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.66.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.66.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.66.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.66.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.66.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.67.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.67.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.67.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.67.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.67.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.67.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.68.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.68.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.68.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.68.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.68.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.68.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.69.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.69.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.69.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.69.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.69.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.69.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.7.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.7.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.7.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.7.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.7.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.7.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.70.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.70.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.70.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.70.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.70.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.70.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.71.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.71.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.71.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.71.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.71.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.71.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.72.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.72.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.72.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.72.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.72.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.72.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.73.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.73.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.73.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.73.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.73.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.73.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.74.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.74.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.74.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.74.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.74.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.74.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.75.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.75.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.75.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.75.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.75.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.75.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.76.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.76.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.76.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.76.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.76.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.76.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.77.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.77.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.77.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.77.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.77.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.77.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.78.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.78.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.78.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.78.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.78.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.78.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.79.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.79.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.79.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.79.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.79.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.79.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.8.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.8.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.8.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.8.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.8.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.8.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.80.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.80.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.80.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.80.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.80.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.80.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.81.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.81.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.81.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.81.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.81.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.81.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.82.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.82.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.82.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.82.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.82.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.82.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.83.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.83.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.83.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.83.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.83.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.83.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.84.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.84.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.84.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.84.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.84.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.84.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.85.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.85.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.85.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.85.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.85.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.85.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.86.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.86.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.86.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.86.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.86.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.86.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.87.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.87.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.87.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.87.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.87.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.87.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.88.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.88.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.88.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.88.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.88.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.88.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.89.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.89.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.89.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.89.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.89.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.89.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.9.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.9.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.9.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.9.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.9.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.9.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.90.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.90.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.90.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.90.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.90.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.90.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.91.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.91.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.91.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.91.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.91.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.91.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.92.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.92.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.92.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.92.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.92.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.92.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.93.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.93.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.93.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.93.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.93.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.93.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.94.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.94.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.94.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.94.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.94.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.94.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.95.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.95.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.95.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.95.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.95.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.95.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.96.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.96.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.96.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.96.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.96.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.96.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.97.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.97.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.97.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.97.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.97.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.97.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.98.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.98.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.98.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.98.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.98.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.98.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.99.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.99.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.99.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.99.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.99.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.experts.99.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.gate.e_score_correction_bias": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.gate.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.shared_experts.down_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.shared_experts.down_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.shared_experts.gate_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.shared_experts.gate_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.shared_experts.up_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.mlp.shared_experts.up_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.post_attention_layernorm.weight": "model-00029-of-00047.safetensors", + "model.layers.28.self_attn.k_proj.bias": "model-00029-of-00047.safetensors", + "model.layers.28.self_attn.k_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.self_attn.k_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.self_attn.o_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.self_attn.o_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.self_attn.q_proj.bias": "model-00029-of-00047.safetensors", + "model.layers.28.self_attn.q_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.self_attn.q_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.28.self_attn.v_proj.bias": "model-00029-of-00047.safetensors", + "model.layers.28.self_attn.v_proj.weight": "model-00029-of-00047.safetensors", + "model.layers.28.self_attn.v_proj.weight_scale": "model-00029-of-00047.safetensors", + "model.layers.29.input_layernorm.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.0.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.0.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.0.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.0.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.0.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.0.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.1.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.1.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.1.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.1.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.1.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.1.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.10.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.10.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.10.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.10.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.10.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.10.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.100.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.100.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.100.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.100.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.100.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.100.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.101.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.101.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.101.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.101.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.101.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.101.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.102.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.102.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.102.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.102.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.102.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.102.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.103.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.103.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.103.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.103.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.103.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.103.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.104.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.104.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.104.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.104.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.104.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.104.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.105.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.105.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.105.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.105.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.105.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.105.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.106.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.106.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.106.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.106.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.106.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.106.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.107.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.107.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.107.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.107.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.107.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.107.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.108.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.108.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.108.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.108.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.108.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.108.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.109.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.109.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.109.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.109.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.109.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.109.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.11.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.11.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.11.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.11.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.11.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.11.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.110.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.110.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.110.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.110.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.110.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.110.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.111.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.111.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.111.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.111.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.111.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.111.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.112.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.112.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.112.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.112.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.112.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.112.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.113.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.113.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.113.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.113.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.113.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.113.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.114.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.114.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.114.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.114.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.114.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.114.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.115.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.115.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.115.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.115.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.115.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.115.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.116.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.116.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.116.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.116.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.116.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.116.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.117.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.117.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.117.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.117.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.117.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.117.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.118.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.118.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.118.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.118.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.118.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.118.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.119.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.119.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.119.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.119.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.119.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.119.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.12.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.12.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.12.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.12.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.12.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.12.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.120.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.120.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.120.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.120.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.120.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.120.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.121.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.121.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.121.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.121.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.121.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.121.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.122.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.122.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.122.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.122.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.122.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.122.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.123.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.123.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.123.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.123.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.123.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.123.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.124.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.124.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.124.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.124.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.124.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.124.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.125.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.125.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.125.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.125.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.125.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.125.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.126.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.126.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.126.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.126.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.126.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.126.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.127.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.127.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.127.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.127.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.127.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.127.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.13.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.13.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.13.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.13.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.13.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.13.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.14.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.14.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.14.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.14.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.14.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.14.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.15.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.15.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.15.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.15.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.15.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.15.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.16.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.16.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.16.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.16.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.16.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.16.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.17.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.17.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.17.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.17.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.17.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.17.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.18.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.18.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.18.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.18.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.18.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.18.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.19.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.19.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.19.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.19.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.19.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.19.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.2.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.2.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.2.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.2.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.2.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.2.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.20.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.20.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.20.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.20.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.20.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.20.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.21.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.21.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.21.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.21.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.21.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.21.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.22.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.22.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.22.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.22.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.22.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.22.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.23.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.23.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.23.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.23.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.23.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.23.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.24.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.24.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.24.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.24.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.24.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.24.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.25.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.25.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.25.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.25.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.25.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.25.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.26.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.26.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.26.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.26.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.26.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.26.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.27.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.27.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.27.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.27.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.27.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.27.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.28.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.28.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.28.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.28.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.28.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.28.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.29.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.29.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.29.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.29.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.29.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.29.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.3.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.3.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.3.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.3.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.3.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.3.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.30.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.30.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.30.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.30.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.30.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.30.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.31.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.31.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.31.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.31.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.31.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.31.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.32.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.32.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.32.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.32.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.32.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.32.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.33.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.33.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.33.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.33.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.33.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.33.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.34.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.34.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.34.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.34.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.34.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.34.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.35.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.35.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.35.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.35.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.35.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.35.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.36.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.36.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.36.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.36.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.36.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.36.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.37.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.37.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.37.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.37.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.37.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.37.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.38.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.38.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.38.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.38.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.38.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.38.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.39.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.39.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.39.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.39.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.39.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.39.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.4.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.4.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.4.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.4.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.4.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.4.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.40.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.40.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.40.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.40.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.40.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.40.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.41.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.41.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.41.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.41.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.41.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.41.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.42.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.42.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.42.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.42.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.42.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.42.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.43.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.43.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.43.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.43.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.43.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.43.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.44.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.44.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.44.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.44.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.44.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.44.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.45.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.45.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.45.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.45.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.45.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.45.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.46.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.46.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.46.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.46.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.46.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.46.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.47.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.47.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.47.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.47.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.47.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.47.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.48.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.48.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.48.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.48.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.48.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.48.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.49.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.49.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.49.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.49.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.49.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.49.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.5.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.5.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.5.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.5.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.5.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.5.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.50.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.50.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.50.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.50.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.50.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.50.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.51.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.51.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.51.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.51.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.51.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.51.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.52.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.52.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.52.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.52.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.52.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.52.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.53.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.53.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.53.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.53.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.53.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.53.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.54.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.54.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.54.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.54.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.54.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.54.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.55.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.55.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.55.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.55.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.55.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.55.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.56.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.56.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.56.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.56.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.56.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.56.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.57.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.57.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.57.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.57.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.57.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.57.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.58.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.58.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.58.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.58.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.58.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.58.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.59.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.59.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.59.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.59.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.59.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.59.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.6.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.6.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.6.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.6.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.6.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.6.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.60.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.60.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.60.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.60.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.60.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.60.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.61.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.61.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.61.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.61.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.61.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.61.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.62.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.62.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.62.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.62.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.62.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.62.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.63.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.63.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.63.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.63.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.63.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.63.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.64.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.64.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.64.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.64.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.64.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.64.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.65.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.65.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.65.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.65.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.65.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.65.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.66.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.66.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.66.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.66.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.66.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.66.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.67.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.67.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.67.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.67.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.67.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.67.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.68.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.68.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.68.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.68.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.68.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.68.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.69.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.69.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.69.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.69.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.69.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.69.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.7.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.7.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.7.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.7.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.7.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.7.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.70.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.70.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.70.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.70.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.70.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.70.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.71.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.71.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.71.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.71.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.71.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.71.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.72.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.72.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.72.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.72.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.72.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.72.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.73.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.73.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.73.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.73.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.73.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.73.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.74.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.74.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.74.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.74.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.74.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.74.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.75.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.75.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.75.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.75.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.75.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.75.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.76.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.76.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.76.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.76.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.76.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.76.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.77.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.77.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.77.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.77.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.77.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.77.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.78.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.78.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.78.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.78.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.78.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.78.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.79.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.79.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.79.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.79.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.79.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.79.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.8.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.8.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.8.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.8.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.8.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.8.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.80.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.80.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.80.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.80.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.80.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.80.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.81.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.81.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.81.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.81.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.81.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.81.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.82.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.82.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.82.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.82.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.82.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.82.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.83.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.83.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.83.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.83.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.83.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.83.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.84.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.84.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.84.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.84.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.84.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.84.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.85.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.85.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.85.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.85.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.85.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.85.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.86.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.86.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.86.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.86.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.86.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.86.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.87.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.87.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.87.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.87.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.87.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.87.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.88.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.88.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.88.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.88.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.88.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.88.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.89.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.89.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.89.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.89.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.89.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.89.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.9.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.9.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.9.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.9.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.9.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.9.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.90.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.90.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.90.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.90.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.90.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.90.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.91.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.91.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.91.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.91.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.91.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.91.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.92.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.92.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.92.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.92.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.92.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.92.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.93.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.93.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.93.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.93.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.93.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.93.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.94.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.94.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.94.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.94.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.94.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.94.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.95.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.95.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.95.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.95.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.95.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.95.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.96.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.96.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.96.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.96.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.96.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.96.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.97.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.97.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.97.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.97.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.97.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.97.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.98.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.98.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.98.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.98.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.98.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.98.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.99.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.99.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.99.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.99.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.99.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.experts.99.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.gate.e_score_correction_bias": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.gate.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.shared_experts.down_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.shared_experts.down_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.shared_experts.gate_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.shared_experts.gate_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.shared_experts.up_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.mlp.shared_experts.up_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.post_attention_layernorm.weight": "model-00030-of-00047.safetensors", + "model.layers.29.self_attn.k_proj.bias": "model-00030-of-00047.safetensors", + "model.layers.29.self_attn.k_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.self_attn.k_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.self_attn.o_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.self_attn.o_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.self_attn.q_proj.bias": "model-00030-of-00047.safetensors", + "model.layers.29.self_attn.q_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.self_attn.q_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.29.self_attn.v_proj.bias": "model-00030-of-00047.safetensors", + "model.layers.29.self_attn.v_proj.weight": "model-00030-of-00047.safetensors", + "model.layers.29.self_attn.v_proj.weight_scale": "model-00030-of-00047.safetensors", + "model.layers.30.input_layernorm.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.0.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.0.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.0.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.0.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.0.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.0.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.1.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.1.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.1.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.1.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.1.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.1.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.10.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.10.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.10.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.10.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.10.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.10.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.100.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.100.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.100.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.100.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.100.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.100.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.101.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.101.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.101.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.101.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.101.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.101.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.102.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.102.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.102.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.102.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.102.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.102.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.103.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.103.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.103.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.103.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.103.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.103.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.104.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.104.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.104.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.104.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.104.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.104.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.105.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.105.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.105.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.105.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.105.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.105.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.106.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.106.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.106.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.106.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.106.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.106.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.107.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.107.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.107.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.107.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.107.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.107.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.108.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.108.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.108.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.108.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.108.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.108.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.109.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.109.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.109.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.109.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.109.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.109.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.11.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.11.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.11.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.11.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.11.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.11.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.110.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.110.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.110.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.110.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.110.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.110.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.111.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.111.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.111.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.111.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.111.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.111.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.112.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.112.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.112.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.112.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.112.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.112.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.113.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.113.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.113.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.113.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.113.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.113.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.114.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.114.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.114.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.114.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.114.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.114.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.115.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.115.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.115.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.115.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.115.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.115.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.116.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.116.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.116.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.116.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.116.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.116.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.117.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.117.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.117.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.117.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.117.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.117.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.118.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.118.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.118.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.118.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.118.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.118.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.119.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.119.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.119.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.119.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.119.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.119.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.12.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.12.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.12.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.12.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.12.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.12.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.120.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.120.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.120.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.120.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.120.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.120.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.121.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.121.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.121.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.121.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.121.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.121.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.122.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.122.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.122.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.122.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.122.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.122.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.123.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.123.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.123.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.123.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.123.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.123.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.124.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.124.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.124.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.124.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.124.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.124.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.125.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.125.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.125.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.125.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.125.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.125.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.126.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.126.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.126.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.126.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.126.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.126.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.127.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.127.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.127.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.127.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.127.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.127.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.13.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.13.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.13.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.13.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.13.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.13.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.14.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.14.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.14.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.14.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.14.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.14.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.15.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.15.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.15.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.15.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.15.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.15.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.16.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.16.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.16.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.16.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.16.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.16.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.17.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.17.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.17.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.17.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.17.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.17.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.18.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.18.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.18.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.18.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.18.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.18.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.19.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.19.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.19.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.19.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.19.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.19.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.2.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.2.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.2.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.2.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.2.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.2.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.20.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.20.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.20.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.20.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.20.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.20.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.21.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.21.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.21.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.21.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.21.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.21.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.22.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.22.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.22.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.22.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.22.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.22.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.23.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.23.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.23.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.23.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.23.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.23.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.24.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.24.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.24.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.24.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.24.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.24.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.25.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.25.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.25.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.25.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.25.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.25.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.26.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.26.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.26.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.26.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.26.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.26.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.27.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.27.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.27.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.27.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.27.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.27.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.28.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.28.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.28.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.28.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.28.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.28.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.29.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.29.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.29.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.29.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.29.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.29.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.3.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.3.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.3.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.3.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.3.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.3.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.30.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.30.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.30.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.30.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.30.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.30.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.31.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.31.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.31.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.31.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.31.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.31.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.32.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.32.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.32.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.32.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.32.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.32.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.33.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.33.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.33.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.33.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.33.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.33.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.34.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.34.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.34.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.34.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.34.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.34.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.35.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.35.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.35.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.35.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.35.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.35.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.36.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.36.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.36.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.36.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.36.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.36.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.37.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.37.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.37.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.37.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.37.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.37.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.38.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.38.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.38.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.38.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.38.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.38.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.39.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.39.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.39.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.39.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.39.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.39.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.4.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.4.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.4.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.4.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.4.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.4.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.40.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.40.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.40.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.40.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.40.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.40.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.41.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.41.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.41.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.41.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.41.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.41.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.42.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.42.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.42.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.42.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.42.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.42.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.43.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.43.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.43.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.43.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.43.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.43.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.44.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.44.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.44.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.44.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.44.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.44.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.45.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.45.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.45.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.45.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.45.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.45.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.46.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.46.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.46.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.46.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.46.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.46.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.47.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.47.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.47.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.47.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.47.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.47.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.48.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.48.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.48.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.48.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.48.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.48.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.49.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.49.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.49.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.49.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.49.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.49.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.5.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.5.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.5.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.5.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.5.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.5.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.50.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.50.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.50.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.50.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.50.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.50.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.51.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.51.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.51.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.51.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.51.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.51.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.52.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.52.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.52.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.52.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.52.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.52.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.53.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.53.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.53.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.53.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.53.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.53.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.54.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.54.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.54.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.54.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.54.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.54.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.55.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.55.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.55.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.55.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.55.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.55.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.56.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.56.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.56.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.56.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.56.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.56.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.57.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.57.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.57.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.57.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.57.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.57.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.58.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.58.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.58.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.58.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.58.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.58.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.59.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.59.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.59.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.59.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.59.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.59.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.6.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.6.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.6.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.6.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.6.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.6.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.60.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.60.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.60.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.60.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.60.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.60.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.61.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.61.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.61.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.61.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.61.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.61.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.62.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.62.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.62.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.62.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.62.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.62.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.63.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.63.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.63.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.63.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.63.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.63.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.64.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.64.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.64.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.64.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.64.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.64.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.65.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.65.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.65.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.65.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.65.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.65.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.66.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.66.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.66.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.66.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.66.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.66.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.67.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.67.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.67.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.67.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.67.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.67.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.68.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.68.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.68.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.68.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.68.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.68.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.69.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.69.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.69.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.69.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.69.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.69.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.7.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.7.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.7.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.7.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.7.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.7.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.70.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.70.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.70.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.70.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.70.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.70.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.71.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.71.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.71.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.71.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.71.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.71.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.72.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.72.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.72.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.72.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.72.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.72.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.73.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.73.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.73.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.73.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.73.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.73.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.74.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.74.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.74.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.74.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.74.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.74.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.75.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.75.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.75.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.75.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.75.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.75.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.76.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.76.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.76.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.76.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.76.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.76.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.77.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.77.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.77.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.77.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.77.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.77.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.78.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.78.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.78.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.78.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.78.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.78.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.79.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.79.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.79.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.79.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.79.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.79.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.8.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.8.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.8.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.8.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.8.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.8.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.80.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.80.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.80.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.80.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.80.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.80.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.81.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.81.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.81.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.81.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.81.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.81.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.82.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.82.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.82.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.82.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.82.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.82.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.83.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.83.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.83.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.83.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.83.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.83.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.84.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.84.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.84.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.84.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.84.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.84.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.85.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.85.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.85.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.85.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.85.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.85.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.86.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.86.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.86.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.86.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.86.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.86.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.87.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.87.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.87.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.87.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.87.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.87.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.88.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.88.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.88.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.88.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.88.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.88.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.89.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.89.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.89.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.89.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.89.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.89.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.9.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.9.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.9.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.9.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.9.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.9.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.90.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.90.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.90.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.90.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.90.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.90.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.91.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.91.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.91.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.91.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.91.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.91.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.92.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.92.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.92.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.92.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.92.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.92.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.93.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.93.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.93.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.93.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.93.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.93.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.94.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.94.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.94.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.94.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.94.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.94.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.95.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.95.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.95.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.95.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.95.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.95.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.96.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.96.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.96.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.96.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.96.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.96.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.97.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.97.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.97.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.97.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.97.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.97.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.98.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.98.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.98.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.98.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.98.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.98.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.99.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.99.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.99.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.99.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.99.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.experts.99.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.gate.e_score_correction_bias": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.gate.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.shared_experts.down_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.shared_experts.down_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.shared_experts.gate_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.shared_experts.gate_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.shared_experts.up_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.mlp.shared_experts.up_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.post_attention_layernorm.weight": "model-00031-of-00047.safetensors", + "model.layers.30.self_attn.k_proj.bias": "model-00031-of-00047.safetensors", + "model.layers.30.self_attn.k_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.self_attn.k_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.self_attn.o_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.self_attn.o_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.self_attn.q_proj.bias": "model-00031-of-00047.safetensors", + "model.layers.30.self_attn.q_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.self_attn.q_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.30.self_attn.v_proj.bias": "model-00031-of-00047.safetensors", + "model.layers.30.self_attn.v_proj.weight": "model-00031-of-00047.safetensors", + "model.layers.30.self_attn.v_proj.weight_scale": "model-00031-of-00047.safetensors", + "model.layers.31.input_layernorm.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.0.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.0.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.0.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.0.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.0.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.0.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.1.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.1.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.1.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.1.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.1.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.1.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.10.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.10.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.10.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.10.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.10.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.10.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.100.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.100.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.100.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.100.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.100.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.100.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.101.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.101.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.101.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.101.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.101.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.101.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.102.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.102.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.102.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.102.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.102.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.102.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.103.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.103.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.103.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.103.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.103.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.103.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.104.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.104.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.104.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.104.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.104.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.104.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.105.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.105.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.105.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.105.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.105.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.105.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.106.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.106.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.106.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.106.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.106.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.106.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.107.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.107.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.107.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.107.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.107.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.107.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.108.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.108.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.108.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.108.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.108.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.108.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.109.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.109.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.109.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.109.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.109.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.109.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.11.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.11.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.11.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.11.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.11.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.11.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.110.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.110.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.110.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.110.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.110.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.110.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.111.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.111.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.111.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.111.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.111.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.111.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.112.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.112.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.112.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.112.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.112.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.112.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.113.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.113.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.113.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.113.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.113.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.113.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.114.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.114.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.114.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.114.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.114.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.114.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.115.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.115.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.115.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.115.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.115.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.115.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.116.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.116.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.116.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.116.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.116.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.116.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.117.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.117.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.117.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.117.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.117.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.117.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.118.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.118.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.118.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.118.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.118.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.118.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.119.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.119.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.119.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.119.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.119.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.119.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.12.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.12.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.12.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.12.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.12.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.12.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.120.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.120.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.120.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.120.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.120.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.120.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.121.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.121.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.121.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.121.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.121.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.121.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.122.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.122.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.122.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.122.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.122.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.122.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.123.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.123.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.123.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.123.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.123.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.123.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.124.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.124.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.124.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.124.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.124.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.124.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.125.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.125.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.125.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.125.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.125.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.125.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.126.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.126.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.126.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.126.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.126.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.126.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.127.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.127.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.127.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.127.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.127.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.127.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.13.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.13.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.13.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.13.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.13.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.13.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.14.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.14.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.14.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.14.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.14.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.14.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.15.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.15.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.15.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.15.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.15.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.15.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.16.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.16.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.16.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.16.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.16.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.16.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.17.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.17.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.17.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.17.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.17.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.17.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.18.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.18.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.18.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.18.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.18.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.18.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.19.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.19.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.19.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.19.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.19.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.19.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.2.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.2.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.2.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.2.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.2.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.2.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.20.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.20.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.20.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.20.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.20.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.20.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.21.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.21.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.21.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.21.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.21.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.21.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.22.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.22.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.22.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.22.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.22.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.22.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.23.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.23.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.23.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.23.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.23.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.23.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.24.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.24.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.24.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.24.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.24.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.24.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.25.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.25.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.25.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.25.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.25.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.25.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.26.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.26.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.26.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.26.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.26.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.26.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.27.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.27.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.27.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.27.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.27.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.27.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.28.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.28.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.28.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.28.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.28.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.28.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.29.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.29.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.29.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.29.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.29.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.29.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.3.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.3.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.3.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.3.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.3.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.3.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.30.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.30.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.30.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.30.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.30.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.30.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.31.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.31.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.31.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.31.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.31.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.31.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.32.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.32.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.32.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.32.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.32.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.32.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.33.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.33.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.33.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.33.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.33.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.33.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.34.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.34.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.34.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.34.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.34.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.34.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.35.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.35.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.35.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.35.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.35.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.35.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.36.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.36.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.36.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.36.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.36.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.36.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.37.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.37.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.37.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.37.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.37.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.37.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.38.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.38.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.38.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.38.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.38.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.38.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.39.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.39.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.39.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.39.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.39.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.39.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.4.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.4.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.4.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.4.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.4.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.4.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.40.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.40.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.40.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.40.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.40.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.40.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.41.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.41.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.41.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.41.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.41.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.41.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.42.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.42.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.42.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.42.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.42.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.42.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.43.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.43.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.43.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.43.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.43.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.43.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.44.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.44.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.44.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.44.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.44.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.44.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.45.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.45.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.45.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.45.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.45.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.45.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.46.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.46.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.46.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.46.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.46.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.46.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.47.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.47.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.47.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.47.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.47.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.47.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.48.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.48.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.48.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.48.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.48.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.48.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.49.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.49.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.49.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.49.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.49.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.49.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.5.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.5.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.5.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.5.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.5.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.5.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.50.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.50.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.50.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.50.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.50.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.50.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.51.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.51.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.51.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.51.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.51.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.51.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.52.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.52.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.52.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.52.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.52.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.52.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.53.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.53.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.53.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.53.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.53.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.53.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.54.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.54.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.54.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.54.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.54.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.54.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.55.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.55.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.55.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.55.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.55.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.55.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.56.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.56.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.56.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.56.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.56.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.56.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.57.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.57.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.57.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.57.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.57.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.57.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.58.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.58.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.58.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.58.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.58.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.58.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.59.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.59.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.59.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.59.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.59.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.59.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.6.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.6.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.6.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.6.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.6.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.6.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.60.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.60.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.60.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.60.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.60.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.60.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.61.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.61.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.61.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.61.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.61.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.61.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.62.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.62.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.62.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.62.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.62.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.62.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.63.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.63.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.63.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.63.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.63.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.63.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.64.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.64.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.64.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.64.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.64.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.64.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.65.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.65.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.65.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.65.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.65.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.65.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.66.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.66.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.66.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.66.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.66.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.66.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.67.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.67.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.67.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.67.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.67.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.67.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.68.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.68.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.68.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.68.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.68.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.68.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.69.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.69.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.69.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.69.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.69.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.69.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.7.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.7.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.7.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.7.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.7.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.7.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.70.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.70.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.70.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.70.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.70.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.70.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.71.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.71.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.71.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.71.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.71.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.71.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.72.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.72.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.72.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.72.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.72.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.72.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.73.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.73.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.73.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.73.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.73.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.73.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.74.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.74.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.74.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.74.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.74.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.74.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.75.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.75.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.75.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.75.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.75.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.75.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.76.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.76.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.76.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.76.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.76.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.76.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.77.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.77.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.77.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.77.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.77.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.77.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.78.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.78.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.78.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.78.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.78.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.78.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.79.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.79.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.79.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.79.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.79.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.79.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.8.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.8.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.8.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.8.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.8.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.8.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.80.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.80.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.80.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.80.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.80.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.80.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.81.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.81.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.81.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.81.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.81.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.81.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.82.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.82.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.82.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.82.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.82.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.82.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.83.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.83.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.83.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.83.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.83.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.83.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.84.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.84.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.84.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.84.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.84.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.84.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.85.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.85.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.85.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.85.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.85.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.85.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.86.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.86.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.86.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.86.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.86.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.86.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.87.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.87.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.87.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.87.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.87.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.87.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.88.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.88.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.88.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.88.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.88.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.88.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.89.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.89.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.89.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.89.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.89.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.89.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.9.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.9.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.9.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.9.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.9.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.9.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.90.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.90.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.90.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.90.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.90.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.90.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.91.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.91.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.91.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.91.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.91.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.91.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.92.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.92.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.92.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.92.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.92.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.92.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.93.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.93.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.93.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.93.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.93.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.93.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.94.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.94.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.94.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.94.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.94.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.94.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.95.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.95.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.95.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.95.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.95.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.95.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.96.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.96.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.96.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.96.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.96.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.96.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.97.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.97.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.97.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.97.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.97.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.97.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.98.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.98.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.98.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.98.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.98.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.98.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.99.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.99.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.99.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.99.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.99.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.experts.99.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.gate.e_score_correction_bias": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.gate.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.shared_experts.down_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.shared_experts.down_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.shared_experts.gate_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.shared_experts.gate_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.shared_experts.up_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.mlp.shared_experts.up_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.post_attention_layernorm.weight": "model-00032-of-00047.safetensors", + "model.layers.31.self_attn.k_proj.bias": "model-00032-of-00047.safetensors", + "model.layers.31.self_attn.k_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.self_attn.k_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.self_attn.o_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.self_attn.o_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.self_attn.q_proj.bias": "model-00032-of-00047.safetensors", + "model.layers.31.self_attn.q_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.self_attn.q_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.31.self_attn.v_proj.bias": "model-00032-of-00047.safetensors", + "model.layers.31.self_attn.v_proj.weight": "model-00032-of-00047.safetensors", + "model.layers.31.self_attn.v_proj.weight_scale": "model-00032-of-00047.safetensors", + "model.layers.32.input_layernorm.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.0.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.0.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.0.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.0.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.0.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.0.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.1.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.1.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.1.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.1.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.1.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.1.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.10.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.10.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.10.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.10.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.10.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.10.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.100.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.100.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.100.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.100.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.100.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.100.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.101.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.101.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.101.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.101.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.101.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.101.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.102.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.102.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.102.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.102.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.102.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.102.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.103.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.103.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.103.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.103.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.103.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.103.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.104.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.104.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.104.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.104.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.104.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.104.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.105.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.105.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.105.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.105.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.105.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.105.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.106.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.106.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.106.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.106.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.106.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.106.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.107.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.107.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.107.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.107.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.107.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.107.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.108.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.108.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.108.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.108.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.108.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.108.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.109.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.109.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.109.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.109.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.109.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.109.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.11.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.11.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.11.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.11.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.11.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.11.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.110.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.110.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.110.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.110.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.110.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.110.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.111.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.111.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.111.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.111.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.111.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.111.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.112.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.112.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.112.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.112.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.112.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.112.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.113.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.113.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.113.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.113.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.113.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.113.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.114.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.114.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.114.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.114.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.114.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.114.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.115.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.115.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.115.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.115.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.115.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.115.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.116.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.116.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.116.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.116.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.116.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.116.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.117.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.117.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.117.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.117.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.117.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.117.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.118.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.118.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.118.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.118.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.118.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.118.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.119.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.119.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.119.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.119.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.119.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.119.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.12.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.12.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.12.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.12.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.12.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.12.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.120.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.120.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.120.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.120.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.120.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.120.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.121.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.121.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.121.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.121.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.121.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.121.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.122.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.122.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.122.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.122.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.122.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.122.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.123.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.123.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.123.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.123.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.123.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.123.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.124.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.124.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.124.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.124.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.124.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.124.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.125.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.125.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.125.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.125.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.125.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.125.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.126.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.126.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.126.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.126.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.126.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.126.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.127.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.127.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.127.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.127.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.127.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.127.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.13.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.13.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.13.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.13.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.13.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.13.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.14.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.14.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.14.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.14.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.14.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.14.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.15.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.15.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.15.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.15.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.15.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.15.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.16.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.16.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.16.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.16.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.16.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.16.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.17.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.17.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.17.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.17.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.17.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.17.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.18.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.18.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.18.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.18.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.18.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.18.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.19.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.19.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.19.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.19.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.19.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.19.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.2.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.2.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.2.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.2.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.2.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.2.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.20.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.20.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.20.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.20.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.20.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.20.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.21.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.21.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.21.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.21.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.21.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.21.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.22.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.22.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.22.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.22.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.22.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.22.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.23.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.23.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.23.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.23.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.23.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.23.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.24.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.24.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.24.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.24.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.24.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.24.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.25.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.25.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.25.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.25.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.25.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.25.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.26.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.26.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.26.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.26.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.26.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.26.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.27.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.27.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.27.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.27.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.27.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.27.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.28.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.28.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.28.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.28.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.28.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.28.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.29.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.29.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.29.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.29.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.29.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.29.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.3.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.3.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.3.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.3.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.3.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.3.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.30.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.30.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.30.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.30.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.30.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.30.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.31.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.31.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.31.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.31.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.31.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.31.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.32.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.32.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.32.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.32.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.32.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.32.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.33.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.33.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.33.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.33.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.33.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.33.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.34.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.34.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.34.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.34.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.34.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.34.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.35.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.35.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.35.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.35.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.35.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.35.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.36.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.36.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.36.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.36.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.36.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.36.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.37.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.37.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.37.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.37.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.37.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.37.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.38.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.38.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.38.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.38.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.38.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.38.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.39.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.39.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.39.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.39.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.39.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.39.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.4.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.4.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.4.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.4.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.4.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.4.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.40.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.40.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.40.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.40.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.40.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.40.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.41.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.41.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.41.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.41.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.41.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.41.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.42.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.42.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.42.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.42.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.42.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.42.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.43.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.43.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.43.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.43.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.43.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.43.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.44.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.44.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.44.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.44.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.44.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.44.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.45.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.45.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.45.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.45.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.45.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.45.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.46.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.46.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.46.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.46.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.46.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.46.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.47.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.47.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.47.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.47.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.47.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.47.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.48.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.48.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.48.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.48.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.48.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.48.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.49.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.49.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.49.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.49.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.49.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.49.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.5.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.5.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.5.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.5.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.5.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.5.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.50.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.50.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.50.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.50.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.50.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.50.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.51.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.51.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.51.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.51.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.51.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.51.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.52.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.52.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.52.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.52.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.52.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.52.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.53.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.53.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.53.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.53.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.53.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.53.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.54.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.54.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.54.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.54.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.54.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.54.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.55.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.55.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.55.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.55.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.55.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.55.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.56.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.56.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.56.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.56.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.56.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.56.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.57.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.57.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.57.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.57.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.57.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.57.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.58.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.58.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.58.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.58.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.58.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.58.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.59.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.59.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.59.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.59.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.59.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.59.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.6.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.6.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.6.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.6.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.6.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.6.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.60.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.60.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.60.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.60.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.60.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.60.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.61.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.61.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.61.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.61.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.61.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.61.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.62.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.62.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.62.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.62.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.62.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.62.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.63.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.63.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.63.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.63.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.63.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.63.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.64.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.64.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.64.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.64.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.64.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.64.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.65.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.65.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.65.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.65.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.65.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.65.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.66.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.66.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.66.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.66.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.66.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.66.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.67.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.67.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.67.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.67.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.67.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.67.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.68.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.68.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.68.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.68.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.68.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.68.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.69.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.69.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.69.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.69.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.69.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.69.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.7.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.7.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.7.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.7.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.7.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.7.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.70.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.70.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.70.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.70.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.70.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.70.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.71.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.71.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.71.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.71.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.71.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.71.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.72.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.72.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.72.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.72.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.72.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.72.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.73.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.73.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.73.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.73.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.73.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.73.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.74.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.74.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.74.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.74.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.74.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.74.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.75.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.75.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.75.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.75.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.75.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.75.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.76.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.76.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.76.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.76.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.76.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.76.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.77.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.77.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.77.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.77.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.77.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.77.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.78.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.78.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.78.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.78.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.78.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.78.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.79.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.79.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.79.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.79.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.79.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.79.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.8.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.8.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.8.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.8.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.8.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.8.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.80.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.80.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.80.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.80.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.80.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.80.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.81.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.81.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.81.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.81.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.81.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.81.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.82.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.82.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.82.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.82.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.82.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.82.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.83.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.83.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.83.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.83.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.83.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.83.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.84.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.84.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.84.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.84.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.84.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.84.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.85.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.85.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.85.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.85.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.85.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.85.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.86.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.86.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.86.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.86.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.86.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.86.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.87.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.87.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.87.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.87.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.87.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.87.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.88.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.88.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.88.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.88.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.88.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.88.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.89.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.89.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.89.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.89.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.89.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.89.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.9.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.9.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.9.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.9.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.9.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.9.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.90.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.90.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.90.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.90.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.90.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.90.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.91.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.91.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.91.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.91.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.91.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.91.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.92.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.92.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.92.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.92.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.92.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.92.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.93.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.93.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.93.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.93.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.93.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.93.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.94.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.94.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.94.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.94.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.94.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.94.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.95.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.95.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.95.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.95.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.95.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.95.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.96.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.96.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.96.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.96.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.96.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.96.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.97.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.97.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.97.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.97.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.97.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.97.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.98.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.98.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.98.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.98.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.98.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.98.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.99.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.99.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.99.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.99.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.99.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.experts.99.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.gate.e_score_correction_bias": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.gate.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.shared_experts.down_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.shared_experts.down_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.shared_experts.gate_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.shared_experts.gate_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.shared_experts.up_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.mlp.shared_experts.up_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.post_attention_layernorm.weight": "model-00033-of-00047.safetensors", + "model.layers.32.self_attn.k_proj.bias": "model-00033-of-00047.safetensors", + "model.layers.32.self_attn.k_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.self_attn.k_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.self_attn.o_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.self_attn.o_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.self_attn.q_proj.bias": "model-00033-of-00047.safetensors", + "model.layers.32.self_attn.q_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.self_attn.q_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.32.self_attn.v_proj.bias": "model-00033-of-00047.safetensors", + "model.layers.32.self_attn.v_proj.weight": "model-00033-of-00047.safetensors", + "model.layers.32.self_attn.v_proj.weight_scale": "model-00033-of-00047.safetensors", + "model.layers.33.input_layernorm.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.0.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.0.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.0.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.0.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.0.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.0.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.1.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.1.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.1.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.1.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.1.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.1.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.10.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.10.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.10.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.10.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.10.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.10.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.100.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.100.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.100.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.100.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.100.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.100.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.101.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.101.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.101.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.101.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.101.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.101.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.102.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.102.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.102.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.102.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.102.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.102.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.103.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.103.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.103.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.103.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.103.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.103.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.104.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.104.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.104.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.104.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.104.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.104.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.105.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.105.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.105.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.105.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.105.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.105.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.106.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.106.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.106.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.106.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.106.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.106.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.107.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.107.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.107.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.107.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.107.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.107.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.108.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.108.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.108.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.108.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.108.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.108.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.109.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.109.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.109.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.109.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.109.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.109.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.11.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.11.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.11.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.11.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.11.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.11.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.110.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.110.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.110.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.110.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.110.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.110.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.111.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.111.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.111.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.111.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.111.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.111.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.112.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.112.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.112.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.112.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.112.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.112.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.113.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.113.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.113.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.113.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.113.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.113.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.114.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.114.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.114.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.114.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.114.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.114.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.115.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.115.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.115.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.115.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.115.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.115.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.116.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.116.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.116.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.116.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.116.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.116.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.117.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.117.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.117.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.117.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.117.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.117.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.118.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.118.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.118.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.118.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.118.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.118.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.119.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.119.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.119.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.119.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.119.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.119.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.12.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.12.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.12.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.12.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.12.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.12.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.120.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.120.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.120.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.120.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.120.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.120.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.121.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.121.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.121.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.121.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.121.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.121.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.122.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.122.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.122.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.122.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.122.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.122.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.123.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.123.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.123.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.123.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.123.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.123.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.124.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.124.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.124.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.124.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.124.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.124.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.125.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.125.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.125.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.125.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.125.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.125.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.126.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.126.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.126.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.126.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.126.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.126.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.127.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.127.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.127.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.127.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.127.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.127.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.13.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.13.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.13.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.13.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.13.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.13.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.14.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.14.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.14.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.14.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.14.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.14.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.15.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.15.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.15.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.15.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.15.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.15.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.16.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.16.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.16.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.16.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.16.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.16.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.17.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.17.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.17.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.17.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.17.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.17.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.18.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.18.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.18.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.18.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.18.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.18.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.19.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.19.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.19.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.19.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.19.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.19.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.2.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.2.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.2.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.2.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.2.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.2.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.20.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.20.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.20.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.20.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.20.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.20.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.21.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.21.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.21.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.21.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.21.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.21.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.22.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.22.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.22.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.22.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.22.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.22.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.23.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.23.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.23.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.23.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.23.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.23.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.24.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.24.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.24.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.24.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.24.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.24.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.25.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.25.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.25.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.25.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.25.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.25.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.26.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.26.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.26.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.26.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.26.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.26.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.27.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.27.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.27.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.27.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.27.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.27.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.28.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.28.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.28.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.28.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.28.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.28.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.29.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.29.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.29.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.29.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.29.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.29.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.3.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.3.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.3.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.3.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.3.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.3.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.30.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.30.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.30.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.30.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.30.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.30.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.31.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.31.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.31.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.31.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.31.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.31.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.32.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.32.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.32.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.32.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.32.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.32.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.33.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.33.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.33.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.33.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.33.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.33.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.34.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.34.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.34.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.34.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.34.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.34.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.35.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.35.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.35.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.35.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.35.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.35.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.36.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.36.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.36.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.36.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.36.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.36.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.37.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.37.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.37.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.37.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.37.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.37.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.38.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.38.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.38.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.38.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.38.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.38.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.39.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.39.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.39.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.39.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.39.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.39.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.4.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.4.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.4.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.4.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.4.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.4.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.40.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.40.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.40.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.40.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.40.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.40.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.41.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.41.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.41.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.41.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.41.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.41.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.42.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.42.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.42.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.42.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.42.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.42.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.43.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.43.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.43.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.43.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.43.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.43.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.44.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.44.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.44.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.44.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.44.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.44.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.45.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.45.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.45.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.45.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.45.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.45.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.46.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.46.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.46.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.46.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.46.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.46.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.47.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.47.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.47.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.47.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.47.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.47.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.48.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.48.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.48.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.48.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.48.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.48.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.49.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.49.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.49.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.49.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.49.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.49.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.5.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.5.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.5.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.5.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.5.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.5.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.50.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.50.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.50.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.50.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.50.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.50.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.51.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.51.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.51.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.51.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.51.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.51.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.52.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.52.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.52.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.52.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.52.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.52.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.53.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.53.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.53.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.53.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.53.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.53.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.54.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.54.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.54.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.54.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.54.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.54.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.55.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.55.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.55.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.55.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.55.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.55.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.56.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.56.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.56.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.56.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.56.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.56.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.57.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.57.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.57.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.57.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.57.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.57.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.58.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.58.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.58.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.58.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.58.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.58.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.59.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.59.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.59.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.59.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.59.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.59.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.6.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.6.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.6.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.6.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.6.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.6.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.60.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.60.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.60.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.60.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.60.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.60.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.61.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.61.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.61.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.61.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.61.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.61.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.62.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.62.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.62.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.62.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.62.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.62.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.63.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.63.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.63.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.63.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.63.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.63.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.64.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.64.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.64.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.64.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.64.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.64.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.65.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.65.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.65.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.65.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.65.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.65.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.66.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.66.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.66.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.66.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.66.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.66.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.67.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.67.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.67.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.67.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.67.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.67.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.68.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.68.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.68.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.68.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.68.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.68.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.69.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.69.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.69.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.69.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.69.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.69.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.7.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.7.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.7.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.7.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.7.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.7.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.70.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.70.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.70.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.70.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.70.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.70.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.71.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.71.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.71.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.71.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.71.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.71.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.72.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.72.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.72.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.72.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.72.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.72.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.73.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.73.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.73.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.73.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.73.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.73.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.74.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.74.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.74.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.74.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.74.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.74.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.75.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.75.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.75.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.75.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.75.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.75.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.76.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.76.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.76.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.76.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.76.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.76.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.77.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.77.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.77.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.77.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.77.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.77.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.78.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.78.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.78.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.78.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.78.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.78.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.79.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.79.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.79.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.79.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.79.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.79.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.8.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.8.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.8.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.8.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.8.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.8.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.80.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.80.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.80.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.80.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.80.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.80.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.81.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.81.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.81.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.81.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.81.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.81.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.82.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.82.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.82.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.82.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.82.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.82.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.83.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.83.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.83.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.83.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.83.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.83.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.84.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.84.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.84.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.84.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.84.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.84.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.85.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.85.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.85.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.85.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.85.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.85.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.86.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.86.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.86.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.86.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.86.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.86.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.87.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.87.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.87.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.87.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.87.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.87.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.88.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.88.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.88.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.88.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.88.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.88.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.89.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.89.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.89.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.89.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.89.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.89.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.9.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.9.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.9.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.9.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.9.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.9.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.90.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.90.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.90.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.90.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.90.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.90.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.91.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.91.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.91.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.91.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.91.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.91.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.92.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.92.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.92.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.92.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.92.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.92.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.93.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.93.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.93.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.93.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.93.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.93.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.94.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.94.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.94.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.94.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.94.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.94.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.95.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.95.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.95.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.95.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.95.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.95.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.96.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.96.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.96.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.96.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.96.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.96.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.97.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.97.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.97.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.97.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.97.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.97.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.98.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.98.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.98.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.98.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.98.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.98.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.99.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.99.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.99.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.99.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.99.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.experts.99.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.gate.e_score_correction_bias": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.gate.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.shared_experts.down_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.shared_experts.down_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.shared_experts.gate_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.shared_experts.gate_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.shared_experts.up_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.mlp.shared_experts.up_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.post_attention_layernorm.weight": "model-00034-of-00047.safetensors", + "model.layers.33.self_attn.k_proj.bias": "model-00034-of-00047.safetensors", + "model.layers.33.self_attn.k_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.self_attn.k_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.self_attn.o_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.self_attn.o_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.self_attn.q_proj.bias": "model-00034-of-00047.safetensors", + "model.layers.33.self_attn.q_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.self_attn.q_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.33.self_attn.v_proj.bias": "model-00034-of-00047.safetensors", + "model.layers.33.self_attn.v_proj.weight": "model-00034-of-00047.safetensors", + "model.layers.33.self_attn.v_proj.weight_scale": "model-00034-of-00047.safetensors", + "model.layers.34.input_layernorm.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.0.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.0.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.0.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.0.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.0.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.0.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.1.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.1.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.1.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.1.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.1.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.1.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.10.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.10.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.10.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.10.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.10.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.10.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.100.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.100.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.100.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.100.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.100.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.100.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.101.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.101.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.101.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.101.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.101.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.101.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.102.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.102.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.102.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.102.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.102.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.102.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.103.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.103.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.103.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.103.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.103.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.103.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.104.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.104.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.104.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.104.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.104.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.104.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.105.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.105.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.105.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.105.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.105.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.105.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.106.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.106.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.106.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.106.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.106.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.106.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.107.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.107.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.107.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.107.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.107.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.107.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.108.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.108.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.108.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.108.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.108.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.108.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.109.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.109.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.109.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.109.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.109.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.109.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.11.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.11.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.11.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.11.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.11.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.11.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.110.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.110.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.110.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.110.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.110.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.110.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.111.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.111.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.111.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.111.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.111.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.111.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.112.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.112.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.112.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.112.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.112.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.112.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.113.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.113.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.113.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.113.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.113.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.113.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.114.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.114.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.114.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.114.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.114.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.114.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.115.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.115.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.115.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.115.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.115.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.115.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.116.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.116.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.116.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.116.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.116.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.116.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.117.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.117.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.117.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.117.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.117.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.117.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.118.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.118.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.118.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.118.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.118.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.118.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.119.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.119.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.119.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.119.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.119.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.119.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.12.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.12.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.12.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.12.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.12.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.12.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.120.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.120.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.120.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.120.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.120.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.120.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.121.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.121.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.121.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.121.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.121.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.121.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.122.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.122.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.122.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.122.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.122.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.122.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.123.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.123.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.123.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.123.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.123.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.123.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.124.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.124.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.124.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.124.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.124.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.124.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.125.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.125.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.125.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.125.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.125.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.125.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.126.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.126.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.126.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.126.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.126.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.126.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.127.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.127.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.127.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.127.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.127.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.127.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.13.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.13.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.13.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.13.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.13.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.13.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.14.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.14.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.14.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.14.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.14.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.14.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.15.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.15.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.15.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.15.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.15.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.15.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.16.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.16.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.16.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.16.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.16.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.16.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.17.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.17.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.17.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.17.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.17.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.17.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.18.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.18.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.18.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.18.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.18.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.18.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.19.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.19.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.19.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.19.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.19.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.19.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.2.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.2.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.2.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.2.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.2.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.2.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.20.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.20.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.20.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.20.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.20.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.20.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.21.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.21.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.21.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.21.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.21.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.21.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.22.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.22.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.22.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.22.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.22.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.22.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.23.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.23.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.23.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.23.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.23.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.23.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.24.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.24.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.24.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.24.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.24.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.24.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.25.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.25.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.25.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.25.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.25.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.25.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.26.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.26.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.26.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.26.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.26.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.26.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.27.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.27.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.27.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.27.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.27.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.27.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.28.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.28.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.28.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.28.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.28.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.28.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.29.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.29.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.29.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.29.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.29.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.29.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.3.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.3.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.3.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.3.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.3.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.3.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.30.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.30.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.30.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.30.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.30.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.30.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.31.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.31.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.31.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.31.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.31.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.31.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.32.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.32.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.32.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.32.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.32.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.32.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.33.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.33.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.33.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.33.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.33.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.33.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.34.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.34.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.34.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.34.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.34.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.34.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.35.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.35.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.35.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.35.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.35.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.35.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.36.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.36.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.36.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.36.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.36.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.36.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.37.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.37.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.37.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.37.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.37.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.37.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.38.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.38.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.38.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.38.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.38.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.38.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.39.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.39.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.39.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.39.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.39.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.39.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.4.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.4.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.4.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.4.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.4.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.4.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.40.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.40.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.40.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.40.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.40.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.40.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.41.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.41.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.41.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.41.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.41.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.41.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.42.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.42.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.42.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.42.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.42.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.42.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.43.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.43.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.43.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.43.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.43.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.43.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.44.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.44.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.44.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.44.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.44.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.44.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.45.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.45.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.45.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.45.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.45.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.45.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.46.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.46.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.46.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.46.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.46.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.46.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.47.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.47.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.47.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.47.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.47.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.47.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.48.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.48.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.48.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.48.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.48.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.48.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.49.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.49.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.49.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.49.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.49.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.49.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.5.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.5.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.5.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.5.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.5.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.5.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.50.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.50.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.50.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.50.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.50.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.50.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.51.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.51.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.51.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.51.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.51.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.51.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.52.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.52.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.52.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.52.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.52.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.52.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.53.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.53.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.53.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.53.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.53.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.53.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.54.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.54.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.54.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.54.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.54.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.54.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.55.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.55.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.55.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.55.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.55.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.55.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.56.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.56.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.56.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.56.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.56.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.56.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.57.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.57.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.57.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.57.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.57.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.57.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.58.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.58.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.58.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.58.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.58.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.58.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.59.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.59.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.59.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.59.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.59.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.59.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.6.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.6.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.6.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.6.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.6.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.6.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.60.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.60.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.60.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.60.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.60.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.60.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.61.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.61.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.61.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.61.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.61.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.61.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.62.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.62.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.62.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.62.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.62.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.62.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.63.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.63.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.63.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.63.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.63.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.63.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.64.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.64.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.64.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.64.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.64.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.64.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.65.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.65.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.65.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.65.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.65.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.65.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.66.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.66.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.66.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.66.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.66.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.66.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.67.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.67.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.67.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.67.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.67.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.67.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.68.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.68.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.68.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.68.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.68.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.68.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.69.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.69.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.69.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.69.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.69.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.69.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.7.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.7.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.7.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.7.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.7.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.7.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.70.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.70.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.70.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.70.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.70.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.70.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.71.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.71.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.71.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.71.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.71.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.71.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.72.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.72.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.72.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.72.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.72.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.72.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.73.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.73.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.73.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.73.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.73.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.73.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.74.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.74.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.74.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.74.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.74.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.74.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.75.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.75.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.75.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.75.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.75.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.75.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.76.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.76.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.76.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.76.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.76.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.76.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.77.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.77.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.77.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.77.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.77.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.77.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.78.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.78.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.78.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.78.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.78.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.78.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.79.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.79.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.79.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.79.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.79.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.79.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.8.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.8.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.8.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.8.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.8.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.8.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.80.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.80.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.80.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.80.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.80.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.80.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.81.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.81.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.81.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.81.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.81.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.81.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.82.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.82.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.82.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.82.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.82.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.82.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.83.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.83.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.83.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.83.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.83.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.83.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.84.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.84.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.84.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.84.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.84.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.84.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.85.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.85.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.85.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.85.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.85.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.85.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.86.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.86.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.86.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.86.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.86.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.86.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.87.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.87.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.87.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.87.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.87.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.87.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.88.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.88.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.88.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.88.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.88.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.88.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.89.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.89.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.89.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.89.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.89.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.89.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.9.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.9.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.9.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.9.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.9.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.9.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.90.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.90.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.90.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.90.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.90.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.90.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.91.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.91.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.91.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.91.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.91.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.91.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.92.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.92.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.92.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.92.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.92.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.92.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.93.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.93.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.93.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.93.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.93.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.93.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.94.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.94.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.94.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.94.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.94.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.94.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.95.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.95.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.95.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.95.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.95.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.95.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.96.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.96.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.96.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.96.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.96.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.96.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.97.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.97.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.97.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.97.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.97.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.97.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.98.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.98.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.98.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.98.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.98.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.98.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.99.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.99.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.99.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.99.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.99.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.experts.99.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.gate.e_score_correction_bias": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.gate.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.shared_experts.down_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.shared_experts.down_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.shared_experts.gate_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.shared_experts.gate_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.shared_experts.up_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.mlp.shared_experts.up_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.post_attention_layernorm.weight": "model-00035-of-00047.safetensors", + "model.layers.34.self_attn.k_proj.bias": "model-00035-of-00047.safetensors", + "model.layers.34.self_attn.k_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.self_attn.k_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.self_attn.o_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.self_attn.o_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.self_attn.q_proj.bias": "model-00035-of-00047.safetensors", + "model.layers.34.self_attn.q_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.self_attn.q_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.34.self_attn.v_proj.bias": "model-00035-of-00047.safetensors", + "model.layers.34.self_attn.v_proj.weight": "model-00035-of-00047.safetensors", + "model.layers.34.self_attn.v_proj.weight_scale": "model-00035-of-00047.safetensors", + "model.layers.35.input_layernorm.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.0.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.0.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.0.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.0.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.0.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.0.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.1.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.1.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.1.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.1.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.1.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.1.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.10.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.10.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.10.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.10.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.10.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.10.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.100.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.100.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.100.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.100.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.100.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.100.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.101.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.101.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.101.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.101.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.101.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.101.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.102.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.102.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.102.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.102.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.102.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.102.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.103.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.103.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.103.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.103.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.103.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.103.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.104.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.104.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.104.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.104.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.104.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.104.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.105.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.105.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.105.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.105.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.105.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.105.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.106.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.106.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.106.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.106.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.106.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.106.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.107.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.107.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.107.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.107.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.107.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.107.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.108.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.108.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.108.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.108.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.108.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.108.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.109.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.109.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.109.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.109.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.109.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.109.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.11.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.11.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.11.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.11.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.11.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.11.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.110.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.110.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.110.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.110.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.110.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.110.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.111.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.111.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.111.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.111.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.111.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.111.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.112.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.112.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.112.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.112.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.112.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.112.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.113.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.113.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.113.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.113.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.113.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.113.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.114.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.114.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.114.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.114.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.114.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.114.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.115.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.115.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.115.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.115.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.115.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.115.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.116.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.116.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.116.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.116.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.116.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.116.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.117.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.117.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.117.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.117.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.117.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.117.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.118.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.118.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.118.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.118.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.118.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.118.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.119.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.119.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.119.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.119.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.119.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.119.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.12.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.12.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.12.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.12.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.12.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.12.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.120.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.120.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.120.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.120.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.120.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.120.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.121.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.121.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.121.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.121.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.121.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.121.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.122.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.122.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.122.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.122.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.122.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.122.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.123.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.123.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.123.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.123.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.123.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.123.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.124.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.124.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.124.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.124.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.124.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.124.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.125.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.125.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.125.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.125.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.125.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.125.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.126.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.126.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.126.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.126.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.126.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.126.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.127.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.127.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.127.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.127.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.127.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.127.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.13.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.13.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.13.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.13.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.13.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.13.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.14.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.14.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.14.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.14.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.14.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.14.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.15.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.15.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.15.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.15.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.15.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.15.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.16.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.16.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.16.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.16.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.16.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.16.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.17.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.17.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.17.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.17.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.17.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.17.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.18.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.18.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.18.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.18.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.18.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.18.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.19.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.19.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.19.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.19.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.19.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.19.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.2.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.2.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.2.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.2.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.2.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.2.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.20.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.20.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.20.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.20.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.20.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.20.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.21.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.21.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.21.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.21.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.21.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.21.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.22.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.22.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.22.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.22.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.22.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.22.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.23.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.23.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.23.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.23.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.23.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.23.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.24.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.24.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.24.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.24.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.24.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.24.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.25.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.25.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.25.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.25.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.25.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.25.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.26.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.26.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.26.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.26.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.26.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.26.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.27.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.27.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.27.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.27.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.27.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.27.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.28.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.28.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.28.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.28.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.28.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.28.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.29.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.29.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.29.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.29.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.29.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.29.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.3.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.3.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.3.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.3.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.3.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.3.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.30.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.30.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.30.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.30.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.30.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.30.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.31.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.31.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.31.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.31.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.31.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.31.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.32.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.32.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.32.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.32.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.32.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.32.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.33.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.33.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.33.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.33.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.33.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.33.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.34.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.34.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.34.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.34.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.34.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.34.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.35.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.35.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.35.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.35.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.35.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.35.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.36.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.36.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.36.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.36.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.36.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.36.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.37.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.37.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.37.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.37.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.37.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.37.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.38.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.38.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.38.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.38.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.38.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.38.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.39.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.39.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.39.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.39.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.39.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.39.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.4.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.4.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.4.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.4.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.4.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.4.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.40.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.40.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.40.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.40.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.40.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.40.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.41.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.41.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.41.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.41.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.41.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.41.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.42.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.42.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.42.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.42.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.42.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.42.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.43.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.43.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.43.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.43.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.43.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.43.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.44.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.44.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.44.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.44.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.44.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.44.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.45.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.45.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.45.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.45.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.45.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.45.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.46.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.46.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.46.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.46.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.46.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.46.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.47.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.47.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.47.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.47.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.47.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.47.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.48.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.48.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.48.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.48.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.48.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.48.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.49.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.49.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.49.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.49.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.49.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.49.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.5.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.5.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.5.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.5.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.5.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.5.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.50.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.50.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.50.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.50.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.50.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.50.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.51.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.51.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.51.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.51.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.51.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.51.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.52.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.52.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.52.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.52.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.52.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.52.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.53.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.53.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.53.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.53.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.53.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.53.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.54.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.54.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.54.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.54.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.54.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.54.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.55.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.55.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.55.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.55.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.55.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.55.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.56.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.56.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.56.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.56.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.56.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.56.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.57.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.57.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.57.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.57.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.57.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.57.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.58.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.58.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.58.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.58.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.58.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.58.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.59.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.59.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.59.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.59.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.59.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.59.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.6.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.6.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.6.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.6.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.6.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.6.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.60.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.60.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.60.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.60.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.60.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.60.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.61.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.61.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.61.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.61.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.61.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.61.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.62.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.62.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.62.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.62.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.62.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.62.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.63.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.63.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.63.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.63.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.63.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.63.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.64.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.64.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.64.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.64.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.64.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.64.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.65.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.65.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.65.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.65.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.65.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.65.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.66.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.66.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.66.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.66.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.66.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.66.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.67.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.67.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.67.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.67.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.67.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.67.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.68.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.68.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.68.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.68.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.68.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.68.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.69.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.69.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.69.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.69.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.69.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.69.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.7.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.7.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.7.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.7.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.7.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.7.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.70.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.70.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.70.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.70.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.70.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.70.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.71.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.71.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.71.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.71.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.71.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.71.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.72.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.72.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.72.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.72.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.72.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.72.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.73.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.73.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.73.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.73.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.73.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.73.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.74.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.74.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.74.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.74.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.74.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.74.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.75.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.75.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.75.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.75.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.75.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.75.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.76.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.76.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.76.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.76.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.76.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.76.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.77.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.77.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.77.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.77.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.77.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.77.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.78.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.78.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.78.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.78.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.78.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.78.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.79.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.79.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.79.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.79.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.79.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.79.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.8.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.8.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.8.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.8.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.8.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.8.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.80.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.80.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.80.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.80.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.80.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.80.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.81.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.81.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.81.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.81.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.81.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.81.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.82.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.82.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.82.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.82.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.82.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.82.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.83.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.83.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.83.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.83.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.83.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.83.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.84.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.84.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.84.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.84.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.84.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.84.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.85.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.85.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.85.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.85.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.85.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.85.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.86.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.86.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.86.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.86.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.86.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.86.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.87.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.87.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.87.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.87.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.87.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.87.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.88.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.88.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.88.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.88.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.88.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.88.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.89.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.89.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.89.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.89.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.89.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.89.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.9.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.9.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.9.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.9.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.9.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.9.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.90.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.90.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.90.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.90.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.90.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.90.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.91.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.91.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.91.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.91.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.91.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.91.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.92.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.92.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.92.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.92.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.92.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.92.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.93.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.93.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.93.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.93.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.93.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.93.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.94.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.94.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.94.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.94.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.94.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.94.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.95.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.95.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.95.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.95.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.95.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.95.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.96.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.96.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.96.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.96.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.96.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.96.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.97.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.97.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.97.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.97.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.97.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.97.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.98.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.98.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.98.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.98.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.98.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.98.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.99.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.99.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.99.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.99.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.99.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.experts.99.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.gate.e_score_correction_bias": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.gate.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.shared_experts.down_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.shared_experts.down_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.shared_experts.gate_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.shared_experts.gate_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.shared_experts.up_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.mlp.shared_experts.up_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.post_attention_layernorm.weight": "model-00036-of-00047.safetensors", + "model.layers.35.self_attn.k_proj.bias": "model-00036-of-00047.safetensors", + "model.layers.35.self_attn.k_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.self_attn.k_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.self_attn.o_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.self_attn.o_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.self_attn.q_proj.bias": "model-00036-of-00047.safetensors", + "model.layers.35.self_attn.q_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.self_attn.q_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.35.self_attn.v_proj.bias": "model-00036-of-00047.safetensors", + "model.layers.35.self_attn.v_proj.weight": "model-00036-of-00047.safetensors", + "model.layers.35.self_attn.v_proj.weight_scale": "model-00036-of-00047.safetensors", + "model.layers.36.input_layernorm.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.0.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.0.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.0.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.0.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.0.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.0.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.1.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.1.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.1.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.1.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.1.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.1.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.10.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.10.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.10.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.10.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.10.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.10.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.100.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.100.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.100.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.100.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.100.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.100.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.101.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.101.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.101.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.101.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.101.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.101.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.102.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.102.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.102.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.102.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.102.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.102.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.103.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.103.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.103.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.103.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.103.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.103.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.104.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.104.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.104.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.104.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.104.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.104.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.105.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.105.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.105.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.105.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.105.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.105.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.106.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.106.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.106.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.106.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.106.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.106.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.107.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.107.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.107.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.107.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.107.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.107.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.108.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.108.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.108.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.108.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.108.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.108.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.109.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.109.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.109.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.109.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.109.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.109.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.11.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.11.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.11.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.11.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.11.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.11.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.110.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.110.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.110.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.110.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.110.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.110.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.111.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.111.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.111.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.111.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.111.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.111.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.112.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.112.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.112.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.112.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.112.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.112.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.113.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.113.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.113.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.113.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.113.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.113.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.114.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.114.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.114.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.114.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.114.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.114.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.115.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.115.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.115.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.115.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.115.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.115.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.116.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.116.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.116.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.116.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.116.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.116.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.117.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.117.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.117.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.117.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.117.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.117.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.118.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.118.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.118.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.118.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.118.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.118.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.119.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.119.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.119.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.119.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.119.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.119.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.12.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.12.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.12.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.12.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.12.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.12.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.120.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.120.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.120.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.120.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.120.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.120.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.121.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.121.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.121.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.121.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.121.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.121.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.122.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.122.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.122.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.122.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.122.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.122.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.123.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.123.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.123.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.123.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.123.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.123.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.124.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.124.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.124.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.124.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.124.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.124.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.125.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.125.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.125.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.125.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.125.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.125.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.126.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.126.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.126.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.126.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.126.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.126.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.127.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.127.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.127.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.127.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.127.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.127.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.13.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.13.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.13.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.13.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.13.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.13.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.14.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.14.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.14.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.14.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.14.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.14.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.15.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.15.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.15.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.15.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.15.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.15.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.16.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.16.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.16.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.16.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.16.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.16.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.17.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.17.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.17.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.17.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.17.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.17.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.18.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.18.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.18.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.18.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.18.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.18.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.19.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.19.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.19.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.19.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.19.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.19.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.2.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.2.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.2.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.2.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.2.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.2.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.20.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.20.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.20.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.20.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.20.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.20.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.21.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.21.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.21.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.21.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.21.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.21.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.22.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.22.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.22.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.22.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.22.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.22.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.23.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.23.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.23.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.23.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.23.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.23.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.24.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.24.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.24.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.24.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.24.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.24.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.25.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.25.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.25.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.25.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.25.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.25.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.26.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.26.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.26.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.26.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.26.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.26.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.27.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.27.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.27.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.27.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.27.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.27.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.28.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.28.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.28.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.28.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.28.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.28.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.29.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.29.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.29.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.29.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.29.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.29.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.3.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.3.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.3.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.3.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.3.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.3.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.30.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.30.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.30.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.30.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.30.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.30.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.31.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.31.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.31.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.31.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.31.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.31.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.32.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.32.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.32.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.32.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.32.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.32.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.33.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.33.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.33.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.33.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.33.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.33.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.34.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.34.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.34.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.34.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.34.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.34.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.35.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.35.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.35.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.35.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.35.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.35.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.36.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.36.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.36.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.36.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.36.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.36.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.37.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.37.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.37.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.37.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.37.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.37.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.38.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.38.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.38.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.38.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.38.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.38.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.39.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.39.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.39.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.39.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.39.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.39.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.4.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.4.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.4.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.4.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.4.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.4.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.40.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.40.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.40.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.40.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.40.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.40.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.41.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.41.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.41.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.41.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.41.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.41.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.42.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.42.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.42.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.42.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.42.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.42.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.43.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.43.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.43.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.43.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.43.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.43.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.44.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.44.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.44.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.44.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.44.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.44.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.45.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.45.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.45.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.45.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.45.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.45.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.46.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.46.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.46.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.46.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.46.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.46.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.47.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.47.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.47.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.47.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.47.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.47.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.48.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.48.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.48.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.48.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.48.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.48.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.49.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.49.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.49.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.49.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.49.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.49.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.5.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.5.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.5.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.5.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.5.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.5.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.50.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.50.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.50.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.50.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.50.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.50.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.51.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.51.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.51.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.51.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.51.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.51.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.52.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.52.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.52.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.52.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.52.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.52.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.53.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.53.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.53.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.53.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.53.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.53.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.54.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.54.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.54.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.54.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.54.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.54.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.55.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.55.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.55.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.55.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.55.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.55.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.56.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.56.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.56.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.56.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.56.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.56.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.57.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.57.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.57.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.57.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.57.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.57.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.58.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.58.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.58.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.58.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.58.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.58.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.59.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.59.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.59.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.59.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.59.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.59.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.6.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.6.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.6.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.6.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.6.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.6.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.60.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.60.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.60.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.60.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.60.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.60.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.61.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.61.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.61.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.61.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.61.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.61.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.62.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.62.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.62.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.62.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.62.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.62.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.63.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.63.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.63.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.63.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.63.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.63.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.64.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.64.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.64.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.64.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.64.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.64.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.65.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.65.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.65.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.65.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.65.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.65.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.66.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.66.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.66.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.66.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.66.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.66.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.67.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.67.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.67.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.67.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.67.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.67.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.68.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.68.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.68.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.68.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.68.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.68.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.69.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.69.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.69.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.69.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.69.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.69.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.7.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.7.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.7.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.7.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.7.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.7.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.70.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.70.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.70.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.70.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.70.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.70.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.71.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.71.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.71.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.71.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.71.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.71.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.72.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.72.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.72.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.72.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.72.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.72.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.73.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.73.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.73.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.73.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.73.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.73.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.74.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.74.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.74.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.74.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.74.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.74.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.75.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.75.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.75.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.75.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.75.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.75.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.76.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.76.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.76.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.76.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.76.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.76.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.77.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.77.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.77.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.77.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.77.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.77.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.78.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.78.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.78.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.78.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.78.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.78.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.79.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.79.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.79.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.79.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.79.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.79.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.8.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.8.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.8.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.8.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.8.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.8.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.80.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.80.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.80.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.80.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.80.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.80.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.81.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.81.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.81.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.81.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.81.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.81.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.82.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.82.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.82.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.82.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.82.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.82.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.83.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.83.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.83.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.83.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.83.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.83.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.84.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.84.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.84.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.84.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.84.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.84.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.85.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.85.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.85.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.85.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.85.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.85.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.86.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.86.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.86.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.86.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.86.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.86.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.87.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.87.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.87.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.87.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.87.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.87.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.88.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.88.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.88.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.88.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.88.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.88.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.89.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.89.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.89.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.89.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.89.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.89.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.9.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.9.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.9.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.9.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.9.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.9.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.90.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.90.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.90.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.90.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.90.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.90.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.91.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.91.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.91.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.91.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.91.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.91.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.92.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.92.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.92.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.92.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.92.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.92.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.93.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.93.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.93.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.93.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.93.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.93.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.94.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.94.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.94.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.94.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.94.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.94.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.95.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.95.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.95.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.95.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.95.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.95.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.96.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.96.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.96.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.96.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.96.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.96.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.97.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.97.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.97.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.97.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.97.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.97.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.98.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.98.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.98.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.98.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.98.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.98.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.99.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.99.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.99.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.99.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.99.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.experts.99.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.gate.e_score_correction_bias": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.gate.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.shared_experts.down_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.shared_experts.down_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.shared_experts.gate_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.shared_experts.gate_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.shared_experts.up_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.mlp.shared_experts.up_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.post_attention_layernorm.weight": "model-00037-of-00047.safetensors", + "model.layers.36.self_attn.k_proj.bias": "model-00037-of-00047.safetensors", + "model.layers.36.self_attn.k_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.self_attn.k_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.self_attn.o_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.self_attn.o_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.self_attn.q_proj.bias": "model-00037-of-00047.safetensors", + "model.layers.36.self_attn.q_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.self_attn.q_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.36.self_attn.v_proj.bias": "model-00037-of-00047.safetensors", + "model.layers.36.self_attn.v_proj.weight": "model-00037-of-00047.safetensors", + "model.layers.36.self_attn.v_proj.weight_scale": "model-00037-of-00047.safetensors", + "model.layers.37.input_layernorm.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.0.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.0.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.0.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.0.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.0.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.0.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.1.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.1.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.1.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.1.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.1.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.1.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.10.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.10.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.10.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.10.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.10.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.10.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.100.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.100.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.100.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.100.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.100.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.100.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.101.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.101.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.101.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.101.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.101.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.101.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.102.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.102.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.102.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.102.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.102.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.102.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.103.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.103.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.103.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.103.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.103.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.103.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.104.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.104.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.104.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.104.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.104.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.104.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.105.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.105.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.105.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.105.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.105.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.105.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.106.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.106.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.106.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.106.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.106.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.106.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.107.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.107.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.107.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.107.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.107.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.107.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.108.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.108.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.108.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.108.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.108.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.108.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.109.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.109.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.109.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.109.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.109.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.109.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.11.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.11.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.11.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.11.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.11.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.11.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.110.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.110.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.110.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.110.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.110.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.110.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.111.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.111.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.111.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.111.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.111.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.111.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.112.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.112.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.112.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.112.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.112.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.112.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.113.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.113.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.113.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.113.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.113.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.113.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.114.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.114.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.114.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.114.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.114.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.114.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.115.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.115.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.115.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.115.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.115.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.115.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.116.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.116.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.116.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.116.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.116.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.116.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.117.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.117.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.117.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.117.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.117.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.117.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.118.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.118.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.118.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.118.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.118.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.118.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.119.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.119.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.119.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.119.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.119.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.119.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.12.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.12.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.12.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.12.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.12.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.12.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.120.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.120.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.120.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.120.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.120.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.120.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.121.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.121.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.121.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.121.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.121.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.121.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.122.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.122.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.122.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.122.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.122.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.122.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.123.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.123.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.123.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.123.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.123.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.123.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.124.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.124.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.124.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.124.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.124.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.124.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.125.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.125.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.125.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.125.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.125.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.125.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.126.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.126.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.126.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.126.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.126.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.126.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.127.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.127.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.127.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.127.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.127.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.127.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.13.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.13.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.13.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.13.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.13.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.13.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.14.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.14.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.14.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.14.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.14.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.14.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.15.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.15.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.15.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.15.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.15.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.15.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.16.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.16.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.16.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.16.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.16.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.16.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.17.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.17.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.17.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.17.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.17.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.17.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.18.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.18.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.18.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.18.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.18.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.18.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.19.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.19.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.19.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.19.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.19.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.19.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.2.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.2.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.2.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.2.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.2.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.2.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.20.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.20.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.20.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.20.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.20.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.20.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.21.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.21.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.21.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.21.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.21.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.21.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.22.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.22.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.22.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.22.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.22.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.22.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.23.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.23.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.23.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.23.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.23.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.23.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.24.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.24.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.24.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.24.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.24.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.24.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.25.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.25.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.25.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.25.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.25.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.25.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.26.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.26.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.26.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.26.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.26.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.26.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.27.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.27.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.27.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.27.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.27.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.27.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.28.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.28.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.28.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.28.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.28.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.28.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.29.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.29.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.29.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.29.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.29.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.29.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.3.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.3.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.3.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.3.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.3.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.3.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.30.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.30.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.30.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.30.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.30.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.30.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.31.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.31.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.31.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.31.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.31.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.31.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.32.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.32.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.32.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.32.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.32.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.32.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.33.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.33.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.33.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.33.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.33.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.33.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.34.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.34.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.34.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.34.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.34.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.34.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.35.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.35.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.35.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.35.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.35.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.35.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.36.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.36.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.36.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.36.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.36.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.36.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.37.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.37.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.37.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.37.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.37.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.37.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.38.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.38.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.38.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.38.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.38.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.38.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.39.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.39.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.39.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.39.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.39.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.39.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.4.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.4.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.4.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.4.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.4.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.4.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.40.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.40.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.40.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.40.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.40.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.40.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.41.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.41.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.41.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.41.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.41.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.41.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.42.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.42.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.42.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.42.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.42.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.42.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.43.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.43.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.43.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.43.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.43.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.43.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.44.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.44.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.44.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.44.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.44.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.44.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.45.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.45.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.45.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.45.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.45.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.45.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.46.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.46.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.46.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.46.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.46.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.46.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.47.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.47.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.47.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.47.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.47.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.47.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.48.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.48.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.48.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.48.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.48.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.48.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.49.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.49.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.49.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.49.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.49.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.49.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.5.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.5.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.5.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.5.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.5.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.5.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.50.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.50.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.50.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.50.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.50.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.50.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.51.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.51.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.51.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.51.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.51.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.51.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.52.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.52.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.52.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.52.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.52.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.52.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.53.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.53.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.53.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.53.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.53.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.53.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.54.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.54.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.54.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.54.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.54.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.54.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.55.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.55.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.55.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.55.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.55.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.55.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.56.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.56.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.56.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.56.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.56.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.56.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.57.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.57.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.57.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.57.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.57.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.57.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.58.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.58.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.58.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.58.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.58.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.58.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.59.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.59.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.59.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.59.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.59.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.59.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.6.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.6.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.6.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.6.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.6.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.6.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.60.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.60.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.60.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.60.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.60.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.60.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.61.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.61.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.61.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.61.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.61.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.61.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.62.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.62.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.62.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.62.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.62.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.62.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.63.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.63.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.63.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.63.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.63.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.63.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.64.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.64.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.64.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.64.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.64.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.64.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.65.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.65.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.65.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.65.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.65.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.65.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.66.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.66.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.66.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.66.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.66.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.66.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.67.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.67.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.67.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.67.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.67.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.67.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.68.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.68.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.68.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.68.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.68.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.68.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.69.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.69.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.69.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.69.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.69.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.69.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.7.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.7.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.7.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.7.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.7.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.7.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.70.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.70.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.70.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.70.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.70.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.70.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.71.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.71.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.71.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.71.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.71.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.71.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.72.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.72.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.72.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.72.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.72.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.72.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.73.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.73.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.73.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.73.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.73.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.73.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.74.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.74.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.74.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.74.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.74.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.74.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.75.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.75.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.75.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.75.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.75.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.75.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.76.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.76.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.76.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.76.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.76.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.76.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.77.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.77.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.77.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.77.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.77.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.77.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.78.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.78.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.78.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.78.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.78.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.78.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.79.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.79.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.79.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.79.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.79.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.79.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.8.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.8.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.8.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.8.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.8.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.8.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.80.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.80.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.80.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.80.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.80.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.80.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.81.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.81.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.81.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.81.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.81.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.81.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.82.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.82.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.82.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.82.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.82.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.82.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.83.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.83.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.83.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.83.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.83.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.83.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.84.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.84.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.84.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.84.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.84.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.84.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.85.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.85.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.85.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.85.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.85.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.85.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.86.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.86.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.86.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.86.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.86.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.86.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.87.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.87.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.87.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.87.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.87.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.87.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.88.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.88.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.88.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.88.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.88.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.88.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.89.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.89.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.89.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.89.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.89.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.89.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.9.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.9.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.9.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.9.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.9.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.9.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.90.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.90.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.90.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.90.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.90.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.90.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.91.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.91.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.91.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.91.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.91.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.91.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.92.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.92.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.92.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.92.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.92.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.92.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.93.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.93.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.93.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.93.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.93.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.93.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.94.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.94.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.94.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.94.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.94.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.94.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.95.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.95.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.95.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.95.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.95.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.95.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.96.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.96.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.96.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.96.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.96.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.96.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.97.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.97.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.97.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.97.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.97.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.97.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.98.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.98.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.98.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.98.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.98.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.98.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.99.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.99.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.99.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.99.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.99.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.experts.99.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.gate.e_score_correction_bias": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.gate.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.shared_experts.down_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.shared_experts.down_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.shared_experts.gate_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.shared_experts.gate_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.shared_experts.up_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.mlp.shared_experts.up_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.post_attention_layernorm.weight": "model-00038-of-00047.safetensors", + "model.layers.37.self_attn.k_proj.bias": "model-00038-of-00047.safetensors", + "model.layers.37.self_attn.k_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.self_attn.k_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.self_attn.o_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.self_attn.o_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.self_attn.q_proj.bias": "model-00038-of-00047.safetensors", + "model.layers.37.self_attn.q_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.self_attn.q_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.37.self_attn.v_proj.bias": "model-00038-of-00047.safetensors", + "model.layers.37.self_attn.v_proj.weight": "model-00038-of-00047.safetensors", + "model.layers.37.self_attn.v_proj.weight_scale": "model-00038-of-00047.safetensors", + "model.layers.38.input_layernorm.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.0.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.0.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.0.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.0.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.0.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.0.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.1.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.1.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.1.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.1.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.1.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.1.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.10.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.10.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.10.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.10.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.10.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.10.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.100.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.100.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.100.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.100.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.100.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.100.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.101.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.101.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.101.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.101.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.101.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.101.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.102.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.102.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.102.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.102.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.102.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.102.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.103.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.103.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.103.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.103.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.103.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.103.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.104.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.104.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.104.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.104.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.104.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.104.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.105.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.105.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.105.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.105.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.105.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.105.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.106.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.106.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.106.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.106.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.106.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.106.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.107.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.107.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.107.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.107.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.107.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.107.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.108.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.108.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.108.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.108.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.108.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.108.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.109.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.109.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.109.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.109.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.109.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.109.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.11.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.11.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.11.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.11.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.11.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.11.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.110.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.110.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.110.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.110.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.110.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.110.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.111.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.111.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.111.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.111.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.111.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.111.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.112.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.112.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.112.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.112.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.112.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.112.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.113.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.113.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.113.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.113.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.113.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.113.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.114.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.114.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.114.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.114.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.114.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.114.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.115.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.115.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.115.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.115.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.115.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.115.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.116.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.116.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.116.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.116.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.116.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.116.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.117.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.117.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.117.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.117.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.117.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.117.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.118.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.118.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.118.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.118.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.118.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.118.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.119.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.119.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.119.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.119.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.119.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.119.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.12.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.12.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.12.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.12.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.12.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.12.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.120.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.120.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.120.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.120.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.120.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.120.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.121.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.121.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.121.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.121.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.121.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.121.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.122.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.122.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.122.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.122.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.122.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.122.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.123.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.123.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.123.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.123.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.123.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.123.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.124.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.124.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.124.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.124.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.124.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.124.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.125.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.125.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.125.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.125.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.125.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.125.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.126.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.126.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.126.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.126.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.126.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.126.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.127.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.127.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.127.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.127.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.127.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.127.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.13.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.13.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.13.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.13.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.13.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.13.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.14.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.14.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.14.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.14.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.14.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.14.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.15.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.15.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.15.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.15.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.15.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.15.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.16.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.16.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.16.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.16.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.16.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.16.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.17.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.17.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.17.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.17.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.17.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.17.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.18.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.18.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.18.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.18.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.18.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.18.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.19.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.19.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.19.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.19.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.19.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.19.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.2.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.2.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.2.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.2.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.2.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.2.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.20.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.20.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.20.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.20.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.20.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.20.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.21.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.21.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.21.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.21.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.21.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.21.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.22.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.22.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.22.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.22.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.22.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.22.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.23.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.23.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.23.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.23.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.23.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.23.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.24.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.24.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.24.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.24.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.24.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.24.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.25.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.25.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.25.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.25.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.25.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.25.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.26.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.26.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.26.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.26.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.26.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.26.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.27.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.27.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.27.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.27.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.27.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.27.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.28.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.28.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.28.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.28.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.28.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.28.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.29.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.29.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.29.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.29.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.29.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.29.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.3.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.3.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.3.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.3.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.3.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.3.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.30.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.30.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.30.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.30.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.30.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.30.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.31.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.31.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.31.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.31.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.31.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.31.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.32.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.32.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.32.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.32.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.32.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.32.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.33.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.33.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.33.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.33.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.33.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.33.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.34.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.34.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.34.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.34.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.34.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.34.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.35.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.35.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.35.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.35.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.35.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.35.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.36.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.36.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.36.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.36.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.36.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.36.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.37.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.37.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.37.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.37.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.37.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.37.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.38.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.38.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.38.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.38.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.38.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.38.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.39.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.39.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.39.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.39.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.39.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.39.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.4.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.4.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.4.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.4.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.4.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.4.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.40.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.40.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.40.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.40.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.40.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.40.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.41.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.41.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.41.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.41.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.41.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.41.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.42.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.42.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.42.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.42.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.42.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.42.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.43.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.43.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.43.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.43.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.43.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.43.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.44.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.44.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.44.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.44.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.44.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.44.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.45.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.45.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.45.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.45.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.45.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.45.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.46.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.46.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.46.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.46.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.46.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.46.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.47.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.47.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.47.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.47.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.47.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.47.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.48.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.48.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.48.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.48.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.48.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.48.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.49.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.49.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.49.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.49.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.49.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.49.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.5.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.5.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.5.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.5.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.5.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.5.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.50.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.50.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.50.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.50.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.50.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.50.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.51.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.51.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.51.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.51.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.51.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.51.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.52.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.52.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.52.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.52.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.52.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.52.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.53.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.53.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.53.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.53.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.53.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.53.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.54.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.54.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.54.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.54.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.54.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.54.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.55.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.55.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.55.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.55.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.55.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.55.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.56.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.56.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.56.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.56.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.56.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.56.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.57.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.57.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.57.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.57.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.57.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.57.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.58.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.58.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.58.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.58.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.58.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.58.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.59.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.59.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.59.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.59.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.59.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.59.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.6.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.6.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.6.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.6.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.6.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.6.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.60.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.60.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.60.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.60.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.60.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.60.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.61.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.61.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.61.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.61.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.61.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.61.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.62.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.62.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.62.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.62.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.62.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.62.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.63.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.63.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.63.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.63.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.63.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.63.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.64.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.64.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.64.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.64.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.64.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.64.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.65.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.65.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.65.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.65.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.65.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.65.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.66.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.66.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.66.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.66.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.66.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.66.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.67.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.67.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.67.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.67.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.67.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.67.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.68.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.68.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.68.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.68.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.68.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.68.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.69.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.69.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.69.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.69.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.69.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.69.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.7.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.7.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.7.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.7.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.7.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.7.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.70.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.70.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.70.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.70.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.70.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.70.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.71.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.71.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.71.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.71.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.71.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.71.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.72.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.72.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.72.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.72.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.72.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.72.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.73.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.73.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.73.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.73.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.73.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.73.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.74.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.74.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.74.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.74.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.74.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.74.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.75.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.75.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.75.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.75.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.75.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.75.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.76.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.76.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.76.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.76.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.76.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.76.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.77.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.77.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.77.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.77.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.77.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.77.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.78.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.78.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.78.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.78.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.78.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.78.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.79.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.79.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.79.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.79.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.79.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.79.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.8.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.8.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.8.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.8.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.8.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.8.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.80.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.80.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.80.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.80.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.80.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.80.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.81.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.81.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.81.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.81.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.81.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.81.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.82.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.82.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.82.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.82.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.82.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.82.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.83.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.83.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.83.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.83.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.83.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.83.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.84.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.84.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.84.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.84.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.84.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.84.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.85.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.85.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.85.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.85.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.85.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.85.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.86.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.86.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.86.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.86.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.86.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.86.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.87.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.87.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.87.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.87.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.87.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.87.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.88.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.88.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.88.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.88.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.88.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.88.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.89.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.89.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.89.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.89.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.89.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.89.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.9.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.9.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.9.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.9.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.9.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.9.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.90.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.90.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.90.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.90.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.90.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.90.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.91.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.91.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.91.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.91.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.91.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.91.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.92.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.92.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.92.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.92.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.92.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.92.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.93.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.93.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.93.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.93.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.93.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.93.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.94.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.94.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.94.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.94.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.94.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.94.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.95.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.95.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.95.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.95.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.95.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.95.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.96.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.96.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.96.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.96.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.96.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.96.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.97.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.97.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.97.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.97.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.97.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.97.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.98.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.98.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.98.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.98.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.98.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.98.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.99.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.99.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.99.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.99.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.99.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.experts.99.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.gate.e_score_correction_bias": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.gate.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.shared_experts.down_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.shared_experts.down_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.shared_experts.gate_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.shared_experts.gate_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.shared_experts.up_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.mlp.shared_experts.up_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.post_attention_layernorm.weight": "model-00039-of-00047.safetensors", + "model.layers.38.self_attn.k_proj.bias": "model-00039-of-00047.safetensors", + "model.layers.38.self_attn.k_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.self_attn.k_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.self_attn.o_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.self_attn.o_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.self_attn.q_proj.bias": "model-00039-of-00047.safetensors", + "model.layers.38.self_attn.q_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.self_attn.q_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.38.self_attn.v_proj.bias": "model-00039-of-00047.safetensors", + "model.layers.38.self_attn.v_proj.weight": "model-00039-of-00047.safetensors", + "model.layers.38.self_attn.v_proj.weight_scale": "model-00039-of-00047.safetensors", + "model.layers.39.input_layernorm.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.0.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.0.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.0.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.0.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.0.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.0.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.1.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.1.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.1.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.1.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.1.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.1.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.10.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.10.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.10.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.10.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.10.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.10.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.100.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.100.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.100.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.100.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.100.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.100.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.101.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.101.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.101.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.101.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.101.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.101.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.102.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.102.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.102.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.102.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.102.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.102.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.103.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.103.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.103.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.103.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.103.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.103.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.104.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.104.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.104.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.104.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.104.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.104.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.105.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.105.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.105.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.105.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.105.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.105.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.106.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.106.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.106.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.106.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.106.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.106.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.107.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.107.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.107.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.107.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.107.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.107.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.108.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.108.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.108.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.108.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.108.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.108.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.109.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.109.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.109.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.109.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.109.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.109.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.11.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.11.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.11.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.11.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.11.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.11.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.110.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.110.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.110.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.110.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.110.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.110.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.111.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.111.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.111.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.111.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.111.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.111.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.112.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.112.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.112.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.112.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.112.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.112.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.113.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.113.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.113.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.113.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.113.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.113.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.114.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.114.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.114.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.114.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.114.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.114.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.115.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.115.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.115.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.115.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.115.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.115.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.116.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.116.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.116.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.116.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.116.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.116.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.117.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.117.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.117.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.117.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.117.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.117.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.118.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.118.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.118.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.118.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.118.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.118.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.119.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.119.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.119.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.119.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.119.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.119.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.12.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.12.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.12.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.12.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.12.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.12.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.120.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.120.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.120.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.120.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.120.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.120.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.121.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.121.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.121.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.121.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.121.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.121.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.122.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.122.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.122.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.122.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.122.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.122.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.123.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.123.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.123.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.123.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.123.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.123.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.124.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.124.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.124.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.124.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.124.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.124.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.125.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.125.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.125.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.125.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.125.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.125.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.126.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.126.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.126.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.126.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.126.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.126.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.127.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.127.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.127.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.127.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.127.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.127.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.13.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.13.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.13.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.13.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.13.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.13.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.14.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.14.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.14.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.14.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.14.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.14.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.15.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.15.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.15.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.15.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.15.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.15.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.16.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.16.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.16.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.16.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.16.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.16.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.17.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.17.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.17.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.17.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.17.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.17.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.18.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.18.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.18.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.18.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.18.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.18.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.19.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.19.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.19.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.19.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.19.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.19.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.2.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.2.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.2.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.2.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.2.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.2.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.20.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.20.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.20.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.20.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.20.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.20.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.21.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.21.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.21.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.21.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.21.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.21.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.22.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.22.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.22.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.22.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.22.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.22.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.23.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.23.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.23.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.23.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.23.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.23.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.24.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.24.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.24.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.24.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.24.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.24.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.25.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.25.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.25.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.25.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.25.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.25.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.26.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.26.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.26.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.26.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.26.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.26.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.27.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.27.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.27.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.27.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.27.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.27.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.28.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.28.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.28.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.28.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.28.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.28.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.29.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.29.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.29.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.29.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.29.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.29.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.3.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.3.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.3.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.3.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.3.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.3.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.30.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.30.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.30.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.30.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.30.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.30.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.31.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.31.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.31.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.31.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.31.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.31.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.32.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.32.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.32.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.32.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.32.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.32.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.33.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.33.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.33.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.33.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.33.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.33.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.34.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.34.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.34.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.34.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.34.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.34.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.35.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.35.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.35.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.35.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.35.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.35.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.36.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.36.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.36.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.36.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.36.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.36.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.37.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.37.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.37.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.37.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.37.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.37.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.38.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.38.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.38.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.38.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.38.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.38.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.39.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.39.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.39.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.39.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.39.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.39.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.4.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.4.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.4.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.4.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.4.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.4.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.40.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.40.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.40.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.40.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.40.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.40.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.41.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.41.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.41.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.41.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.41.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.41.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.42.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.42.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.42.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.42.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.42.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.42.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.43.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.43.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.43.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.43.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.43.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.43.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.44.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.44.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.44.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.44.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.44.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.44.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.45.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.45.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.45.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.45.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.45.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.45.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.46.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.46.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.46.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.46.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.46.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.46.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.47.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.47.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.47.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.47.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.47.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.47.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.48.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.48.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.48.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.48.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.48.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.48.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.49.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.49.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.49.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.49.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.49.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.49.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.5.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.5.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.5.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.5.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.5.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.5.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.50.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.50.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.50.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.50.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.50.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.50.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.51.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.51.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.51.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.51.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.51.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.51.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.52.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.52.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.52.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.52.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.52.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.52.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.53.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.53.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.53.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.53.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.53.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.53.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.54.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.54.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.54.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.54.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.54.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.54.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.55.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.55.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.55.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.55.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.55.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.55.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.56.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.56.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.56.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.56.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.56.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.56.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.57.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.57.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.57.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.57.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.57.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.57.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.58.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.58.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.58.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.58.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.58.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.58.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.59.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.59.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.59.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.59.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.59.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.59.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.6.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.6.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.6.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.6.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.6.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.6.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.60.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.60.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.60.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.60.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.60.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.60.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.61.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.61.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.61.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.61.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.61.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.61.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.62.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.62.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.62.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.62.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.62.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.62.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.63.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.63.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.63.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.63.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.63.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.63.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.64.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.64.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.64.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.64.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.64.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.64.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.65.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.65.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.65.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.65.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.65.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.65.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.66.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.66.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.66.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.66.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.66.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.66.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.67.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.67.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.67.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.67.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.67.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.67.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.68.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.68.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.68.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.68.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.68.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.68.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.69.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.69.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.69.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.69.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.69.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.69.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.7.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.7.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.7.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.7.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.7.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.7.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.70.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.70.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.70.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.70.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.70.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.70.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.71.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.71.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.71.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.71.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.71.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.71.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.72.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.72.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.72.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.72.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.72.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.72.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.73.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.73.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.73.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.73.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.73.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.73.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.74.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.74.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.74.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.74.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.74.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.74.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.75.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.75.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.75.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.75.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.75.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.75.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.76.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.76.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.76.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.76.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.76.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.76.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.77.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.77.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.77.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.77.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.77.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.77.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.78.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.78.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.78.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.78.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.78.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.78.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.79.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.79.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.79.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.79.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.79.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.79.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.8.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.8.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.8.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.8.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.8.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.8.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.80.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.80.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.80.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.80.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.80.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.80.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.81.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.81.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.81.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.81.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.81.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.81.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.82.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.82.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.82.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.82.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.82.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.82.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.83.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.83.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.83.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.83.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.83.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.83.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.84.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.84.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.84.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.84.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.84.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.84.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.85.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.85.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.85.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.85.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.85.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.85.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.86.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.86.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.86.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.86.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.86.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.86.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.87.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.87.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.87.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.87.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.87.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.87.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.88.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.88.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.88.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.88.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.88.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.88.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.89.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.89.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.89.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.89.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.89.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.89.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.9.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.9.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.9.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.9.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.9.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.9.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.90.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.90.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.90.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.90.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.90.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.90.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.91.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.91.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.91.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.91.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.91.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.91.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.92.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.92.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.92.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.92.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.92.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.92.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.93.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.93.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.93.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.93.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.93.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.93.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.94.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.94.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.94.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.94.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.94.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.94.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.95.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.95.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.95.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.95.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.95.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.95.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.96.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.96.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.96.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.96.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.96.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.96.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.97.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.97.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.97.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.97.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.97.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.97.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.98.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.98.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.98.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.98.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.98.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.98.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.99.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.99.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.99.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.99.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.99.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.experts.99.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.gate.e_score_correction_bias": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.gate.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.shared_experts.down_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.shared_experts.down_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.shared_experts.gate_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.shared_experts.gate_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.shared_experts.up_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.mlp.shared_experts.up_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.post_attention_layernorm.weight": "model-00040-of-00047.safetensors", + "model.layers.39.self_attn.k_proj.bias": "model-00040-of-00047.safetensors", + "model.layers.39.self_attn.k_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.self_attn.k_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.self_attn.o_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.self_attn.o_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.self_attn.q_proj.bias": "model-00040-of-00047.safetensors", + "model.layers.39.self_attn.q_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.self_attn.q_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.39.self_attn.v_proj.bias": "model-00040-of-00047.safetensors", + "model.layers.39.self_attn.v_proj.weight": "model-00040-of-00047.safetensors", + "model.layers.39.self_attn.v_proj.weight_scale": "model-00040-of-00047.safetensors", + "model.layers.40.input_layernorm.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.0.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.0.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.0.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.0.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.0.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.0.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.1.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.1.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.1.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.1.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.1.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.1.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.10.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.10.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.10.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.10.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.10.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.10.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.100.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.100.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.100.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.100.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.100.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.100.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.101.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.101.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.101.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.101.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.101.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.101.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.102.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.102.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.102.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.102.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.102.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.102.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.103.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.103.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.103.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.103.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.103.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.103.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.104.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.104.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.104.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.104.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.104.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.104.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.105.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.105.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.105.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.105.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.105.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.105.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.106.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.106.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.106.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.106.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.106.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.106.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.107.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.107.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.107.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.107.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.107.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.107.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.108.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.108.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.108.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.108.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.108.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.108.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.109.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.109.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.109.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.109.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.109.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.109.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.11.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.11.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.11.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.11.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.11.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.11.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.110.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.110.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.110.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.110.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.110.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.110.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.111.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.111.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.111.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.111.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.111.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.111.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.112.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.112.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.112.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.112.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.112.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.112.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.113.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.113.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.113.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.113.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.113.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.113.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.114.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.114.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.114.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.114.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.114.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.114.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.115.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.115.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.115.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.115.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.115.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.115.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.116.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.116.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.116.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.116.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.116.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.116.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.117.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.117.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.117.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.117.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.117.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.117.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.118.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.118.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.118.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.118.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.118.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.118.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.119.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.119.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.119.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.119.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.119.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.119.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.12.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.12.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.12.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.12.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.12.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.12.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.120.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.120.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.120.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.120.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.120.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.120.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.121.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.121.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.121.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.121.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.121.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.121.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.122.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.122.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.122.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.122.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.122.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.122.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.123.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.123.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.123.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.123.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.123.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.123.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.124.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.124.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.124.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.124.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.124.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.124.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.125.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.125.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.125.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.125.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.125.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.125.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.126.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.126.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.126.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.126.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.126.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.126.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.127.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.127.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.127.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.127.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.127.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.127.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.13.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.13.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.13.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.13.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.13.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.13.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.14.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.14.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.14.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.14.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.14.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.14.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.15.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.15.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.15.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.15.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.15.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.15.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.16.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.16.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.16.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.16.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.16.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.16.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.17.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.17.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.17.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.17.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.17.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.17.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.18.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.18.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.18.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.18.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.18.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.18.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.19.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.19.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.19.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.19.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.19.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.19.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.2.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.2.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.2.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.2.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.2.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.2.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.20.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.20.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.20.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.20.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.20.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.20.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.21.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.21.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.21.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.21.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.21.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.21.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.22.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.22.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.22.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.22.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.22.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.22.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.23.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.23.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.23.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.23.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.23.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.23.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.24.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.24.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.24.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.24.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.24.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.24.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.25.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.25.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.25.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.25.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.25.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.25.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.26.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.26.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.26.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.26.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.26.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.26.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.27.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.27.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.27.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.27.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.27.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.27.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.28.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.28.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.28.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.28.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.28.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.28.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.29.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.29.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.29.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.29.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.29.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.29.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.3.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.3.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.3.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.3.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.3.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.3.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.30.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.30.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.30.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.30.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.30.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.30.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.31.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.31.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.31.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.31.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.31.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.31.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.32.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.32.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.32.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.32.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.32.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.32.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.33.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.33.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.33.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.33.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.33.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.33.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.34.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.34.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.34.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.34.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.34.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.34.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.35.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.35.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.35.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.35.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.35.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.35.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.36.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.36.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.36.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.36.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.36.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.36.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.37.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.37.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.37.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.37.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.37.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.37.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.38.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.38.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.38.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.38.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.38.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.38.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.39.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.39.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.39.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.39.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.39.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.39.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.4.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.4.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.4.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.4.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.4.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.4.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.40.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.40.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.40.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.40.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.40.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.40.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.41.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.41.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.41.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.41.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.41.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.41.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.42.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.42.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.42.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.42.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.42.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.42.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.43.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.43.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.43.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.43.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.43.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.43.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.44.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.44.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.44.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.44.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.44.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.44.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.45.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.45.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.45.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.45.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.45.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.45.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.46.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.46.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.46.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.46.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.46.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.46.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.47.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.47.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.47.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.47.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.47.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.47.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.48.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.48.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.48.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.48.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.48.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.48.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.49.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.49.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.49.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.49.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.49.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.49.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.5.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.5.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.5.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.5.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.5.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.5.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.50.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.50.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.50.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.50.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.50.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.50.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.51.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.51.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.51.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.51.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.51.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.51.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.52.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.52.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.52.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.52.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.52.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.52.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.53.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.53.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.53.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.53.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.53.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.53.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.54.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.54.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.54.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.54.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.54.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.54.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.55.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.55.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.55.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.55.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.55.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.55.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.56.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.56.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.56.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.56.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.56.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.56.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.57.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.57.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.57.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.57.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.57.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.57.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.58.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.58.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.58.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.58.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.58.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.58.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.59.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.59.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.59.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.59.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.59.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.59.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.6.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.6.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.6.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.6.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.6.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.6.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.60.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.60.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.60.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.60.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.60.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.60.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.61.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.61.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.61.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.61.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.61.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.61.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.62.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.62.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.62.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.62.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.62.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.62.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.63.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.63.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.63.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.63.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.63.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.63.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.64.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.64.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.64.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.64.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.64.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.64.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.65.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.65.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.65.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.65.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.65.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.65.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.66.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.66.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.66.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.66.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.66.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.66.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.67.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.67.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.67.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.67.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.67.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.67.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.68.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.68.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.68.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.68.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.68.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.68.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.69.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.69.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.69.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.69.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.69.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.69.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.7.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.7.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.7.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.7.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.7.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.7.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.70.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.70.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.70.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.70.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.70.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.70.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.71.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.71.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.71.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.71.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.71.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.71.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.72.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.72.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.72.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.72.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.72.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.72.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.73.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.73.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.73.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.73.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.73.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.73.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.74.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.74.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.74.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.74.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.74.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.74.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.75.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.75.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.75.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.75.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.75.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.75.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.76.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.76.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.76.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.76.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.76.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.76.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.77.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.77.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.77.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.77.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.77.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.77.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.78.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.78.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.78.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.78.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.78.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.78.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.79.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.79.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.79.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.79.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.79.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.79.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.8.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.8.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.8.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.8.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.8.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.8.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.80.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.80.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.80.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.80.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.80.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.80.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.81.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.81.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.81.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.81.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.81.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.81.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.82.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.82.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.82.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.82.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.82.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.82.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.83.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.83.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.83.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.83.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.83.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.83.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.84.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.84.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.84.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.84.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.84.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.84.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.85.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.85.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.85.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.85.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.85.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.85.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.86.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.86.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.86.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.86.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.86.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.86.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.87.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.87.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.87.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.87.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.87.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.87.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.88.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.88.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.88.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.88.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.88.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.88.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.89.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.89.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.89.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.89.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.89.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.89.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.9.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.9.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.9.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.9.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.9.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.9.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.90.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.90.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.90.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.90.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.90.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.90.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.91.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.91.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.91.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.91.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.91.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.91.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.92.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.92.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.92.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.92.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.92.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.92.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.93.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.93.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.93.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.93.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.93.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.93.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.94.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.94.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.94.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.94.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.94.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.94.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.95.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.95.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.95.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.95.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.95.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.95.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.96.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.96.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.96.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.96.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.96.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.96.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.97.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.97.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.97.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.97.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.97.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.97.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.98.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.98.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.98.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.98.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.98.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.98.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.99.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.99.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.99.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.99.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.99.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.experts.99.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.gate.e_score_correction_bias": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.gate.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.shared_experts.down_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.shared_experts.down_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.shared_experts.gate_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.shared_experts.gate_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.shared_experts.up_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.mlp.shared_experts.up_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.post_attention_layernorm.weight": "model-00041-of-00047.safetensors", + "model.layers.40.self_attn.k_proj.bias": "model-00041-of-00047.safetensors", + "model.layers.40.self_attn.k_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.self_attn.k_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.self_attn.o_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.self_attn.o_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.self_attn.q_proj.bias": "model-00041-of-00047.safetensors", + "model.layers.40.self_attn.q_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.self_attn.q_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.40.self_attn.v_proj.bias": "model-00041-of-00047.safetensors", + "model.layers.40.self_attn.v_proj.weight": "model-00041-of-00047.safetensors", + "model.layers.40.self_attn.v_proj.weight_scale": "model-00041-of-00047.safetensors", + "model.layers.41.input_layernorm.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.0.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.0.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.0.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.0.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.0.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.0.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.1.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.1.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.1.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.1.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.1.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.1.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.10.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.10.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.10.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.10.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.10.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.10.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.100.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.100.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.100.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.100.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.100.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.100.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.101.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.101.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.101.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.101.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.101.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.101.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.102.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.102.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.102.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.102.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.102.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.102.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.103.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.103.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.103.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.103.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.103.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.103.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.104.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.104.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.104.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.104.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.104.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.104.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.105.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.105.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.105.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.105.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.105.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.105.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.106.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.106.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.106.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.106.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.106.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.106.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.107.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.107.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.107.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.107.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.107.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.107.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.108.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.108.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.108.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.108.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.108.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.108.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.109.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.109.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.109.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.109.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.109.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.109.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.11.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.11.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.11.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.11.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.11.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.11.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.110.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.110.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.110.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.110.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.110.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.110.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.111.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.111.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.111.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.111.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.111.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.111.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.112.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.112.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.112.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.112.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.112.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.112.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.113.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.113.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.113.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.113.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.113.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.113.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.114.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.114.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.114.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.114.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.114.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.114.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.115.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.115.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.115.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.115.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.115.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.115.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.116.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.116.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.116.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.116.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.116.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.116.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.117.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.117.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.117.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.117.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.117.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.117.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.118.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.118.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.118.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.118.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.118.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.118.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.119.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.119.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.119.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.119.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.119.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.119.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.12.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.12.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.12.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.12.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.12.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.12.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.120.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.120.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.120.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.120.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.120.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.120.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.121.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.121.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.121.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.121.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.121.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.121.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.122.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.122.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.122.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.122.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.122.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.122.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.123.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.123.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.123.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.123.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.123.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.123.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.124.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.124.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.124.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.124.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.124.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.124.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.125.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.125.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.125.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.125.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.125.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.125.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.126.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.126.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.126.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.126.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.126.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.126.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.127.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.127.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.127.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.127.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.127.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.127.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.13.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.13.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.13.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.13.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.13.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.13.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.14.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.14.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.14.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.14.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.14.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.14.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.15.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.15.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.15.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.15.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.15.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.15.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.16.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.16.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.16.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.16.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.16.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.16.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.17.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.17.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.17.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.17.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.17.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.17.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.18.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.18.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.18.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.18.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.18.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.18.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.19.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.19.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.19.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.19.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.19.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.19.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.2.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.2.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.2.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.2.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.2.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.2.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.20.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.20.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.20.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.20.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.20.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.20.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.21.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.21.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.21.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.21.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.21.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.21.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.22.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.22.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.22.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.22.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.22.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.22.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.23.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.23.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.23.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.23.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.23.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.23.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.24.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.24.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.24.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.24.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.24.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.24.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.25.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.25.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.25.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.25.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.25.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.25.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.26.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.26.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.26.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.26.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.26.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.26.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.27.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.27.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.27.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.27.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.27.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.27.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.28.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.28.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.28.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.28.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.28.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.28.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.29.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.29.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.29.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.29.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.29.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.29.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.3.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.3.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.3.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.3.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.3.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.3.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.30.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.30.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.30.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.30.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.30.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.30.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.31.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.31.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.31.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.31.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.31.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.31.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.32.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.32.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.32.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.32.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.32.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.32.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.33.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.33.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.33.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.33.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.33.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.33.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.34.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.34.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.34.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.34.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.34.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.34.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.35.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.35.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.35.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.35.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.35.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.35.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.36.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.36.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.36.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.36.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.36.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.36.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.37.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.37.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.37.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.37.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.37.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.37.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.38.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.38.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.38.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.38.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.38.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.38.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.39.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.39.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.39.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.39.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.39.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.39.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.4.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.4.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.4.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.4.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.4.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.4.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.40.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.40.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.40.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.40.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.40.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.40.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.41.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.41.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.41.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.41.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.41.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.41.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.42.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.42.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.42.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.42.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.42.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.42.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.43.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.43.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.43.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.43.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.43.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.43.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.44.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.44.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.44.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.44.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.44.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.44.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.45.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.45.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.45.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.45.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.45.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.45.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.46.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.46.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.46.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.46.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.46.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.46.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.47.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.47.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.47.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.47.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.47.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.47.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.48.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.48.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.48.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.48.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.48.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.48.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.49.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.49.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.49.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.49.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.49.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.49.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.5.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.5.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.5.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.5.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.5.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.5.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.50.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.50.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.50.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.50.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.50.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.50.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.51.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.51.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.51.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.51.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.51.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.51.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.52.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.52.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.52.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.52.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.52.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.52.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.53.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.53.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.53.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.53.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.53.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.53.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.54.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.54.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.54.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.54.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.54.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.54.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.55.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.55.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.55.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.55.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.55.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.55.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.56.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.56.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.56.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.56.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.56.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.56.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.57.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.57.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.57.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.57.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.57.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.57.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.58.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.58.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.58.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.58.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.58.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.58.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.59.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.59.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.59.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.59.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.59.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.59.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.6.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.6.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.6.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.6.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.6.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.6.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.60.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.60.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.60.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.60.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.60.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.60.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.61.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.61.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.61.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.61.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.61.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.61.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.62.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.62.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.62.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.62.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.62.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.62.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.63.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.63.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.63.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.63.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.63.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.63.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.64.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.64.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.64.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.64.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.64.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.64.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.65.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.65.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.65.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.65.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.65.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.65.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.66.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.66.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.66.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.66.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.66.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.66.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.67.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.67.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.67.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.67.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.67.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.67.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.68.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.68.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.68.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.68.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.68.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.68.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.69.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.69.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.69.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.69.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.69.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.69.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.7.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.7.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.7.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.7.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.7.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.7.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.70.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.70.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.70.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.70.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.70.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.70.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.71.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.71.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.71.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.71.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.71.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.71.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.72.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.72.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.72.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.72.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.72.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.72.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.73.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.73.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.73.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.73.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.73.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.73.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.74.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.74.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.74.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.74.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.74.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.74.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.75.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.75.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.75.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.75.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.75.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.75.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.76.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.76.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.76.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.76.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.76.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.76.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.77.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.77.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.77.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.77.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.77.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.77.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.78.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.78.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.78.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.78.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.78.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.78.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.79.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.79.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.79.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.79.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.79.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.79.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.8.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.8.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.8.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.8.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.8.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.8.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.80.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.80.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.80.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.80.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.80.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.80.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.81.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.81.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.81.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.81.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.81.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.81.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.82.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.82.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.82.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.82.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.82.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.82.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.83.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.83.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.83.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.83.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.83.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.83.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.84.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.84.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.84.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.84.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.84.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.84.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.85.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.85.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.85.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.85.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.85.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.85.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.86.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.86.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.86.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.86.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.86.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.86.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.87.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.87.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.87.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.87.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.87.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.87.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.88.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.88.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.88.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.88.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.88.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.88.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.89.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.89.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.89.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.89.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.89.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.89.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.9.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.9.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.9.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.9.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.9.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.9.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.90.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.90.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.90.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.90.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.90.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.90.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.91.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.91.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.91.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.91.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.91.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.91.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.92.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.92.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.92.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.92.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.92.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.92.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.93.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.93.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.93.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.93.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.93.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.93.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.94.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.94.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.94.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.94.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.94.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.94.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.95.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.95.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.95.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.95.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.95.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.95.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.96.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.96.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.96.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.96.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.96.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.96.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.97.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.97.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.97.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.97.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.97.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.97.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.98.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.98.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.98.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.98.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.98.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.98.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.99.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.99.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.99.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.99.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.99.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.experts.99.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.gate.e_score_correction_bias": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.gate.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.shared_experts.down_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.shared_experts.down_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.shared_experts.gate_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.shared_experts.gate_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.shared_experts.up_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.mlp.shared_experts.up_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.post_attention_layernorm.weight": "model-00042-of-00047.safetensors", + "model.layers.41.self_attn.k_proj.bias": "model-00042-of-00047.safetensors", + "model.layers.41.self_attn.k_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.self_attn.k_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.self_attn.o_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.self_attn.o_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.self_attn.q_proj.bias": "model-00042-of-00047.safetensors", + "model.layers.41.self_attn.q_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.self_attn.q_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.41.self_attn.v_proj.bias": "model-00042-of-00047.safetensors", + "model.layers.41.self_attn.v_proj.weight": "model-00042-of-00047.safetensors", + "model.layers.41.self_attn.v_proj.weight_scale": "model-00042-of-00047.safetensors", + "model.layers.42.input_layernorm.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.0.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.0.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.0.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.0.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.0.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.0.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.1.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.1.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.1.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.1.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.1.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.1.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.10.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.10.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.10.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.10.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.10.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.10.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.100.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.100.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.100.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.100.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.100.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.100.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.101.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.101.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.101.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.101.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.101.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.101.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.102.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.102.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.102.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.102.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.102.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.102.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.103.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.103.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.103.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.103.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.103.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.103.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.104.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.104.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.104.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.104.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.104.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.104.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.105.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.105.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.105.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.105.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.105.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.105.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.106.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.106.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.106.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.106.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.106.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.106.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.107.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.107.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.107.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.107.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.107.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.107.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.108.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.108.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.108.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.108.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.108.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.108.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.109.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.109.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.109.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.109.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.109.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.109.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.11.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.11.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.11.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.11.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.11.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.11.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.110.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.110.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.110.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.110.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.110.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.110.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.111.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.111.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.111.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.111.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.111.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.111.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.112.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.112.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.112.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.112.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.112.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.112.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.113.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.113.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.113.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.113.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.113.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.113.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.114.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.114.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.114.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.114.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.114.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.114.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.115.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.115.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.115.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.115.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.115.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.115.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.116.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.116.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.116.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.116.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.116.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.116.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.117.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.117.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.117.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.117.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.117.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.117.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.118.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.118.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.118.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.118.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.118.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.118.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.119.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.119.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.119.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.119.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.119.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.119.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.12.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.12.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.12.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.12.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.12.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.12.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.120.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.120.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.120.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.120.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.120.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.120.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.121.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.121.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.121.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.121.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.121.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.121.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.122.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.122.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.122.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.122.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.122.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.122.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.123.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.123.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.123.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.123.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.123.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.123.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.124.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.124.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.124.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.124.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.124.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.124.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.125.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.125.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.125.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.125.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.125.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.125.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.126.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.126.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.126.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.126.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.126.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.126.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.127.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.127.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.127.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.127.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.127.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.127.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.13.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.13.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.13.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.13.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.13.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.13.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.14.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.14.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.14.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.14.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.14.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.14.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.15.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.15.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.15.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.15.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.15.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.15.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.16.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.16.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.16.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.16.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.16.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.16.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.17.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.17.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.17.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.17.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.17.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.17.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.18.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.18.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.18.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.18.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.18.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.18.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.19.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.19.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.19.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.19.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.19.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.19.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.2.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.2.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.2.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.2.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.2.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.2.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.20.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.20.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.20.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.20.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.20.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.20.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.21.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.21.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.21.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.21.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.21.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.21.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.22.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.22.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.22.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.22.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.22.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.22.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.23.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.23.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.23.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.23.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.23.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.23.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.24.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.24.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.24.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.24.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.24.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.24.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.25.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.25.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.25.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.25.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.25.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.25.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.26.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.26.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.26.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.26.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.26.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.26.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.27.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.27.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.27.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.27.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.27.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.27.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.28.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.28.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.28.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.28.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.28.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.28.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.29.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.29.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.29.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.29.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.29.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.29.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.3.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.3.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.3.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.3.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.3.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.3.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.30.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.30.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.30.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.30.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.30.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.30.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.31.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.31.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.31.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.31.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.31.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.31.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.32.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.32.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.32.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.32.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.32.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.32.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.33.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.33.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.33.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.33.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.33.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.33.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.34.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.34.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.34.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.34.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.34.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.34.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.35.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.35.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.35.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.35.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.35.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.35.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.36.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.36.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.36.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.36.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.36.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.36.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.37.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.37.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.37.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.37.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.37.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.37.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.38.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.38.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.38.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.38.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.38.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.38.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.39.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.39.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.39.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.39.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.39.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.39.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.4.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.4.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.4.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.4.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.4.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.4.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.40.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.40.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.40.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.40.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.40.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.40.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.41.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.41.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.41.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.41.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.41.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.41.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.42.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.42.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.42.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.42.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.42.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.42.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.43.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.43.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.43.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.43.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.43.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.43.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.44.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.44.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.44.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.44.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.44.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.44.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.45.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.45.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.45.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.45.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.45.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.45.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.46.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.46.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.46.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.46.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.46.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.46.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.47.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.47.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.47.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.47.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.47.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.47.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.48.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.48.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.48.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.48.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.48.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.48.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.49.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.49.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.49.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.49.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.49.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.49.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.5.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.5.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.5.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.5.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.5.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.5.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.50.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.50.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.50.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.50.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.50.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.50.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.51.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.51.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.51.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.51.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.51.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.51.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.52.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.52.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.52.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.52.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.52.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.52.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.53.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.53.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.53.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.53.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.53.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.53.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.54.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.54.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.54.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.54.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.54.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.54.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.55.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.55.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.55.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.55.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.55.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.55.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.56.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.56.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.56.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.56.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.56.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.56.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.57.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.57.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.57.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.57.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.57.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.57.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.58.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.58.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.58.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.58.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.58.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.58.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.59.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.59.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.59.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.59.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.59.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.59.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.6.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.6.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.6.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.6.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.6.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.6.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.60.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.60.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.60.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.60.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.60.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.60.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.61.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.61.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.61.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.61.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.61.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.61.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.62.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.62.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.62.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.62.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.62.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.62.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.63.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.63.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.63.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.63.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.63.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.63.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.64.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.64.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.64.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.64.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.64.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.64.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.65.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.65.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.65.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.65.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.65.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.65.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.66.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.66.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.66.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.66.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.66.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.66.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.67.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.67.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.67.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.67.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.67.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.67.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.68.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.68.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.68.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.68.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.68.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.68.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.69.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.69.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.69.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.69.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.69.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.69.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.7.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.7.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.7.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.7.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.7.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.7.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.70.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.70.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.70.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.70.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.70.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.70.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.71.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.71.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.71.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.71.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.71.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.71.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.72.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.72.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.72.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.72.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.72.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.72.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.73.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.73.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.73.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.73.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.73.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.73.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.74.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.74.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.74.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.74.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.74.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.74.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.75.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.75.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.75.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.75.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.75.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.75.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.76.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.76.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.76.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.76.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.76.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.76.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.77.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.77.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.77.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.77.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.77.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.77.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.78.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.78.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.78.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.78.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.78.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.78.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.79.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.79.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.79.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.79.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.79.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.79.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.8.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.8.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.8.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.8.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.8.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.8.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.80.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.80.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.80.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.80.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.80.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.80.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.81.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.81.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.81.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.81.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.81.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.81.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.82.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.82.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.82.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.82.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.82.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.82.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.83.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.83.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.83.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.83.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.83.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.83.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.84.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.84.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.84.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.84.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.84.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.84.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.85.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.85.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.85.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.85.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.85.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.85.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.86.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.86.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.86.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.86.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.86.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.86.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.87.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.87.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.87.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.87.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.87.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.87.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.88.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.88.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.88.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.88.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.88.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.88.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.89.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.89.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.89.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.89.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.89.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.89.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.9.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.9.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.9.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.9.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.9.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.9.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.90.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.90.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.90.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.90.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.90.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.90.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.91.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.91.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.91.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.91.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.91.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.91.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.92.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.92.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.92.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.92.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.92.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.92.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.93.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.93.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.93.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.93.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.93.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.93.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.94.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.94.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.94.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.94.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.94.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.94.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.95.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.95.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.95.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.95.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.95.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.95.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.96.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.96.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.96.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.96.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.96.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.96.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.97.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.97.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.97.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.97.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.97.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.97.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.98.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.98.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.98.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.98.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.98.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.98.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.99.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.99.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.99.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.99.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.99.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.experts.99.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.gate.e_score_correction_bias": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.gate.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.shared_experts.down_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.shared_experts.down_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.shared_experts.gate_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.shared_experts.gate_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.shared_experts.up_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.mlp.shared_experts.up_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.post_attention_layernorm.weight": "model-00043-of-00047.safetensors", + "model.layers.42.self_attn.k_proj.bias": "model-00043-of-00047.safetensors", + "model.layers.42.self_attn.k_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.self_attn.k_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.self_attn.o_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.self_attn.o_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.self_attn.q_proj.bias": "model-00043-of-00047.safetensors", + "model.layers.42.self_attn.q_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.self_attn.q_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.42.self_attn.v_proj.bias": "model-00043-of-00047.safetensors", + "model.layers.42.self_attn.v_proj.weight": "model-00043-of-00047.safetensors", + "model.layers.42.self_attn.v_proj.weight_scale": "model-00043-of-00047.safetensors", + "model.layers.43.input_layernorm.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.0.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.0.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.0.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.0.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.0.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.0.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.1.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.1.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.1.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.1.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.1.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.1.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.10.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.10.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.10.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.10.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.10.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.10.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.100.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.100.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.100.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.100.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.100.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.100.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.101.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.101.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.101.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.101.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.101.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.101.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.102.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.102.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.102.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.102.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.102.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.102.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.103.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.103.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.103.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.103.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.103.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.103.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.104.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.104.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.104.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.104.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.104.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.104.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.105.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.105.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.105.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.105.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.105.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.105.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.106.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.106.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.106.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.106.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.106.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.106.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.107.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.107.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.107.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.107.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.107.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.107.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.108.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.108.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.108.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.108.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.108.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.108.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.109.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.109.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.109.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.109.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.109.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.109.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.11.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.11.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.11.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.11.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.11.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.11.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.110.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.110.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.110.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.110.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.110.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.110.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.111.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.111.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.111.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.111.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.111.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.111.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.112.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.112.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.112.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.112.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.112.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.112.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.113.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.113.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.113.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.113.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.113.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.113.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.114.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.114.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.114.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.114.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.114.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.114.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.115.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.115.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.115.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.115.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.115.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.115.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.116.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.116.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.116.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.116.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.116.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.116.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.117.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.117.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.117.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.117.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.117.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.117.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.118.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.118.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.118.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.118.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.118.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.118.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.119.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.119.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.119.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.119.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.119.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.119.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.12.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.12.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.12.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.12.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.12.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.12.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.120.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.120.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.120.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.120.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.120.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.120.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.121.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.121.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.121.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.121.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.121.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.121.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.122.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.122.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.122.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.122.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.122.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.122.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.123.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.123.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.123.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.123.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.123.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.123.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.124.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.124.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.124.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.124.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.124.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.124.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.125.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.125.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.125.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.125.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.125.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.125.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.126.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.126.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.126.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.126.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.126.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.126.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.127.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.127.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.127.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.127.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.127.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.127.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.13.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.13.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.13.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.13.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.13.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.13.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.14.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.14.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.14.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.14.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.14.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.14.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.15.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.15.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.15.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.15.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.15.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.15.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.16.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.16.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.16.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.16.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.16.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.16.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.17.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.17.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.17.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.17.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.17.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.17.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.18.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.18.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.18.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.18.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.18.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.18.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.19.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.19.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.19.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.19.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.19.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.19.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.2.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.2.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.2.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.2.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.2.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.2.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.20.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.20.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.20.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.20.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.20.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.20.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.21.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.21.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.21.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.21.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.21.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.21.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.22.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.22.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.22.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.22.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.22.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.22.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.23.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.23.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.23.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.23.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.23.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.23.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.24.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.24.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.24.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.24.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.24.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.24.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.25.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.25.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.25.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.25.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.25.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.25.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.26.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.26.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.26.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.26.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.26.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.26.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.27.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.27.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.27.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.27.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.27.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.27.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.28.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.28.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.28.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.28.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.28.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.28.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.29.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.29.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.29.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.29.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.29.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.29.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.3.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.3.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.3.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.3.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.3.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.3.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.30.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.30.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.30.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.30.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.30.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.30.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.31.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.31.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.31.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.31.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.31.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.31.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.32.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.32.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.32.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.32.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.32.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.32.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.33.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.33.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.33.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.33.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.33.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.33.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.34.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.34.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.34.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.34.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.34.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.34.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.35.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.35.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.35.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.35.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.35.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.35.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.36.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.36.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.36.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.36.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.36.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.36.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.37.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.37.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.37.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.37.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.37.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.37.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.38.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.38.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.38.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.38.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.38.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.38.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.39.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.39.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.39.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.39.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.39.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.39.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.4.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.4.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.4.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.4.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.4.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.4.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.40.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.40.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.40.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.40.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.40.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.40.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.41.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.41.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.41.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.41.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.41.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.41.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.42.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.42.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.42.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.42.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.42.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.42.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.43.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.43.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.43.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.43.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.43.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.43.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.44.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.44.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.44.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.44.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.44.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.44.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.45.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.45.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.45.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.45.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.45.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.45.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.46.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.46.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.46.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.46.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.46.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.46.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.47.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.47.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.47.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.47.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.47.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.47.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.48.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.48.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.48.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.48.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.48.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.48.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.49.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.49.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.49.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.49.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.49.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.49.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.5.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.5.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.5.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.5.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.5.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.5.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.50.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.50.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.50.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.50.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.50.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.50.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.51.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.51.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.51.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.51.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.51.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.51.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.52.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.52.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.52.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.52.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.52.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.52.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.53.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.53.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.53.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.53.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.53.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.53.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.54.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.54.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.54.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.54.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.54.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.54.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.55.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.55.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.55.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.55.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.55.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.55.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.56.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.56.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.56.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.56.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.56.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.56.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.57.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.57.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.57.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.57.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.57.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.57.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.58.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.58.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.58.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.58.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.58.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.58.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.59.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.59.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.59.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.59.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.59.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.59.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.6.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.6.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.6.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.6.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.6.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.6.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.60.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.60.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.60.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.60.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.60.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.60.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.61.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.61.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.61.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.61.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.61.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.61.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.62.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.62.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.62.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.62.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.62.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.62.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.63.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.63.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.63.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.63.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.63.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.63.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.64.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.64.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.64.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.64.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.64.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.64.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.65.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.65.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.65.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.65.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.65.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.65.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.66.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.66.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.66.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.66.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.66.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.66.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.67.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.67.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.67.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.67.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.67.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.67.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.68.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.68.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.68.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.68.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.68.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.68.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.69.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.69.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.69.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.69.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.69.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.69.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.7.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.7.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.7.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.7.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.7.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.7.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.70.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.70.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.70.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.70.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.70.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.70.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.71.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.71.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.71.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.71.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.71.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.71.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.72.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.72.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.72.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.72.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.72.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.72.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.73.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.73.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.73.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.73.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.73.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.73.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.74.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.74.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.74.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.74.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.74.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.74.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.75.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.75.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.75.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.75.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.75.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.75.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.76.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.76.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.76.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.76.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.76.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.76.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.77.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.77.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.77.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.77.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.77.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.77.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.78.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.78.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.78.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.78.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.78.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.78.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.79.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.79.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.79.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.79.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.79.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.79.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.8.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.8.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.8.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.8.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.8.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.8.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.80.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.80.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.80.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.80.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.80.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.80.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.81.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.81.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.81.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.81.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.81.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.81.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.82.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.82.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.82.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.82.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.82.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.82.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.83.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.83.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.83.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.83.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.83.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.83.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.84.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.84.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.84.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.84.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.84.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.84.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.85.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.85.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.85.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.85.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.85.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.85.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.86.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.86.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.86.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.86.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.86.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.86.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.87.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.87.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.87.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.87.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.87.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.87.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.88.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.88.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.88.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.88.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.88.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.88.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.89.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.89.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.89.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.89.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.89.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.89.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.9.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.9.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.9.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.9.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.9.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.9.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.90.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.90.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.90.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.90.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.90.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.90.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.91.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.91.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.91.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.91.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.91.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.91.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.92.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.92.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.92.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.92.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.92.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.92.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.93.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.93.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.93.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.93.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.93.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.93.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.94.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.94.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.94.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.94.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.94.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.94.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.95.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.95.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.95.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.95.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.95.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.95.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.96.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.96.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.96.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.96.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.96.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.96.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.97.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.97.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.97.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.97.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.97.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.97.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.98.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.98.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.98.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.98.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.98.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.98.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.99.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.99.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.99.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.99.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.99.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.experts.99.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.gate.e_score_correction_bias": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.gate.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.shared_experts.down_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.shared_experts.down_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.shared_experts.gate_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.shared_experts.gate_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.shared_experts.up_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.mlp.shared_experts.up_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.post_attention_layernorm.weight": "model-00044-of-00047.safetensors", + "model.layers.43.self_attn.k_proj.bias": "model-00044-of-00047.safetensors", + "model.layers.43.self_attn.k_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.self_attn.k_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.self_attn.o_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.self_attn.o_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.self_attn.q_proj.bias": "model-00044-of-00047.safetensors", + "model.layers.43.self_attn.q_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.self_attn.q_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.43.self_attn.v_proj.bias": "model-00044-of-00047.safetensors", + "model.layers.43.self_attn.v_proj.weight": "model-00044-of-00047.safetensors", + "model.layers.43.self_attn.v_proj.weight_scale": "model-00044-of-00047.safetensors", + "model.layers.44.input_layernorm.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.0.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.0.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.0.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.0.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.0.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.0.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.1.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.1.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.1.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.1.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.1.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.1.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.10.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.10.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.10.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.10.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.10.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.10.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.100.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.100.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.100.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.100.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.100.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.100.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.101.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.101.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.101.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.101.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.101.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.101.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.102.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.102.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.102.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.102.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.102.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.102.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.103.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.103.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.103.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.103.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.103.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.103.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.104.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.104.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.104.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.104.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.104.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.104.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.105.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.105.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.105.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.105.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.105.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.105.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.106.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.106.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.106.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.106.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.106.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.106.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.107.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.107.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.107.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.107.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.107.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.107.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.108.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.108.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.108.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.108.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.108.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.108.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.109.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.109.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.109.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.109.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.109.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.109.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.11.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.11.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.11.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.11.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.11.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.11.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.110.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.110.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.110.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.110.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.110.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.110.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.111.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.111.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.111.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.111.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.111.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.111.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.112.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.112.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.112.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.112.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.112.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.112.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.113.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.113.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.113.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.113.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.113.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.113.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.114.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.114.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.114.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.114.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.114.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.114.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.115.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.115.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.115.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.115.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.115.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.115.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.116.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.116.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.116.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.116.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.116.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.116.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.117.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.117.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.117.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.117.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.117.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.117.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.118.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.118.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.118.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.118.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.118.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.118.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.119.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.119.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.119.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.119.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.119.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.119.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.12.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.12.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.12.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.12.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.12.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.12.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.120.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.120.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.120.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.120.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.120.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.120.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.121.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.121.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.121.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.121.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.121.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.121.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.122.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.122.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.122.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.122.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.122.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.122.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.123.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.123.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.123.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.123.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.123.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.123.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.124.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.124.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.124.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.124.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.124.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.124.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.125.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.125.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.125.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.125.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.125.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.125.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.126.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.126.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.126.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.126.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.126.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.126.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.127.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.127.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.127.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.127.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.127.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.127.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.13.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.13.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.13.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.13.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.13.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.13.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.14.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.14.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.14.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.14.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.14.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.14.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.15.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.15.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.15.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.15.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.15.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.15.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.16.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.16.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.16.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.16.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.16.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.16.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.17.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.17.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.17.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.17.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.17.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.17.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.18.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.18.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.18.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.18.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.18.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.18.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.19.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.19.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.19.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.19.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.19.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.19.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.2.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.2.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.2.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.2.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.2.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.2.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.20.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.20.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.20.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.20.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.20.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.20.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.21.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.21.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.21.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.21.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.21.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.21.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.22.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.22.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.22.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.22.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.22.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.22.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.23.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.23.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.23.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.23.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.23.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.23.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.24.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.24.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.24.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.24.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.24.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.24.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.25.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.25.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.25.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.25.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.25.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.25.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.26.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.26.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.26.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.26.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.26.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.26.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.27.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.27.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.27.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.27.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.27.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.27.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.28.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.28.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.28.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.28.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.28.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.28.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.29.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.29.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.29.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.29.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.29.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.29.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.3.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.3.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.3.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.3.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.3.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.3.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.30.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.30.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.30.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.30.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.30.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.30.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.31.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.31.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.31.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.31.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.31.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.31.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.32.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.32.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.32.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.32.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.32.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.32.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.33.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.33.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.33.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.33.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.33.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.33.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.34.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.34.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.34.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.34.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.34.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.34.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.35.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.35.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.35.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.35.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.35.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.35.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.36.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.36.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.36.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.36.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.36.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.36.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.37.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.37.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.37.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.37.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.37.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.37.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.38.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.38.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.38.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.38.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.38.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.38.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.39.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.39.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.39.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.39.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.39.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.39.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.4.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.4.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.4.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.4.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.4.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.4.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.40.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.40.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.40.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.40.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.40.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.40.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.41.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.41.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.41.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.41.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.41.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.41.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.42.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.42.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.42.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.42.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.42.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.42.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.43.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.43.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.43.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.43.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.43.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.43.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.44.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.44.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.44.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.44.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.44.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.44.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.45.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.45.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.45.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.45.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.45.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.45.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.46.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.46.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.46.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.46.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.46.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.46.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.47.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.47.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.47.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.47.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.47.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.47.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.48.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.48.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.48.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.48.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.48.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.48.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.49.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.49.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.49.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.49.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.49.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.49.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.5.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.5.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.5.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.5.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.5.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.5.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.50.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.50.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.50.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.50.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.50.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.50.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.51.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.51.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.51.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.51.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.51.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.51.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.52.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.52.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.52.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.52.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.52.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.52.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.53.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.53.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.53.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.53.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.53.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.53.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.54.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.54.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.54.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.54.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.54.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.54.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.55.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.55.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.55.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.55.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.55.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.55.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.56.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.56.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.56.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.56.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.56.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.56.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.57.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.57.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.57.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.57.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.57.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.57.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.58.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.58.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.58.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.58.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.58.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.58.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.59.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.59.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.59.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.59.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.59.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.59.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.6.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.6.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.6.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.6.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.6.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.6.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.60.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.60.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.60.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.60.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.60.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.60.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.61.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.61.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.61.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.61.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.61.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.61.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.62.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.62.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.62.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.62.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.62.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.62.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.63.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.63.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.63.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.63.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.63.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.63.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.64.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.64.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.64.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.64.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.64.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.64.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.65.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.65.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.65.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.65.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.65.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.65.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.66.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.66.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.66.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.66.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.66.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.66.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.67.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.67.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.67.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.67.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.67.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.67.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.68.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.68.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.68.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.68.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.68.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.68.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.69.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.69.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.69.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.69.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.69.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.69.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.7.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.7.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.7.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.7.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.7.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.7.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.70.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.70.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.70.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.70.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.70.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.70.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.71.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.71.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.71.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.71.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.71.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.71.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.72.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.72.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.72.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.72.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.72.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.72.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.73.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.73.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.73.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.73.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.73.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.73.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.74.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.74.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.74.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.74.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.74.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.74.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.75.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.75.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.75.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.75.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.75.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.75.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.76.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.76.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.76.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.76.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.76.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.76.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.77.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.77.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.77.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.77.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.77.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.77.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.78.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.78.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.78.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.78.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.78.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.78.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.79.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.79.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.79.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.79.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.79.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.79.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.8.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.8.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.8.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.8.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.8.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.8.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.80.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.80.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.80.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.80.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.80.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.80.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.81.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.81.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.81.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.81.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.81.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.81.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.82.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.82.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.82.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.82.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.82.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.82.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.83.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.83.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.83.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.83.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.83.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.83.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.84.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.84.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.84.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.84.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.84.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.84.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.85.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.85.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.85.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.85.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.85.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.85.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.86.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.86.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.86.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.86.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.86.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.86.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.87.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.87.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.87.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.87.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.87.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.87.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.88.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.88.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.88.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.88.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.88.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.88.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.89.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.89.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.89.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.89.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.89.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.89.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.9.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.9.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.9.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.9.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.9.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.9.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.90.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.90.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.90.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.90.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.90.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.90.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.91.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.91.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.91.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.91.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.91.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.91.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.92.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.92.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.92.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.92.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.92.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.92.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.93.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.93.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.93.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.93.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.93.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.93.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.94.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.94.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.94.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.94.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.94.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.94.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.95.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.95.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.95.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.95.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.95.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.95.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.96.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.96.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.96.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.96.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.96.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.96.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.97.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.97.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.97.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.97.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.97.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.97.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.98.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.98.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.98.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.98.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.98.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.98.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.99.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.99.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.99.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.99.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.99.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.experts.99.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.gate.e_score_correction_bias": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.gate.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.shared_experts.down_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.shared_experts.down_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.shared_experts.gate_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.shared_experts.gate_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.shared_experts.up_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.mlp.shared_experts.up_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.post_attention_layernorm.weight": "model-00045-of-00047.safetensors", + "model.layers.44.self_attn.k_proj.bias": "model-00045-of-00047.safetensors", + "model.layers.44.self_attn.k_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.self_attn.k_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.self_attn.o_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.self_attn.o_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.self_attn.q_proj.bias": "model-00045-of-00047.safetensors", + "model.layers.44.self_attn.q_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.self_attn.q_proj.weight_scale": "model-00045-of-00047.safetensors", + "model.layers.44.self_attn.v_proj.bias": "model-00045-of-00047.safetensors", + "model.layers.44.self_attn.v_proj.weight": "model-00045-of-00047.safetensors", + "model.layers.44.self_attn.v_proj.weight_scale": "model-00045-of-00047.safetensors", + "lm_head.weight": "model-00046-of-00047.safetensors", + "model.layers.45.input_layernorm.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.0.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.0.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.0.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.0.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.0.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.0.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.1.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.1.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.1.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.1.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.1.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.1.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.10.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.10.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.10.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.10.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.10.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.10.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.100.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.100.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.100.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.100.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.100.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.100.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.101.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.101.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.101.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.101.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.101.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.101.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.102.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.102.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.102.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.102.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.102.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.102.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.103.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.103.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.103.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.103.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.103.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.103.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.104.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.104.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.104.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.104.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.104.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.104.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.105.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.105.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.105.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.105.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.105.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.105.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.106.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.106.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.106.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.106.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.106.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.106.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.107.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.107.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.107.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.107.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.107.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.107.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.108.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.108.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.108.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.108.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.108.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.108.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.109.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.109.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.109.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.109.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.109.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.109.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.11.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.11.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.11.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.11.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.11.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.11.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.110.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.110.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.110.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.110.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.110.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.110.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.111.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.111.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.111.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.111.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.111.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.111.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.112.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.112.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.112.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.112.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.112.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.112.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.113.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.113.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.113.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.113.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.113.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.113.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.114.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.114.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.114.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.114.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.114.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.114.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.115.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.115.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.115.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.115.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.115.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.115.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.116.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.116.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.116.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.116.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.116.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.116.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.117.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.117.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.117.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.117.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.117.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.117.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.118.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.118.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.118.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.118.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.118.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.118.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.119.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.119.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.119.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.119.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.119.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.119.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.12.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.12.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.12.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.12.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.12.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.12.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.120.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.120.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.120.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.120.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.120.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.120.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.121.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.121.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.121.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.121.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.121.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.121.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.122.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.122.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.122.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.122.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.122.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.122.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.123.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.123.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.123.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.123.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.123.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.123.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.124.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.124.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.124.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.124.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.124.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.124.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.125.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.125.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.125.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.125.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.125.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.125.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.126.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.126.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.126.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.126.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.126.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.126.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.127.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.127.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.127.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.127.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.127.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.127.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.13.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.13.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.13.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.13.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.13.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.13.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.14.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.14.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.14.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.14.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.14.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.14.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.15.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.15.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.15.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.15.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.15.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.15.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.16.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.16.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.16.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.16.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.16.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.16.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.17.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.17.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.17.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.17.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.17.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.17.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.18.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.18.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.18.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.18.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.18.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.18.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.19.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.19.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.19.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.19.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.19.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.19.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.2.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.2.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.2.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.2.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.2.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.2.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.20.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.20.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.20.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.20.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.20.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.20.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.21.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.21.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.21.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.21.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.21.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.21.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.22.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.22.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.22.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.22.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.22.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.22.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.23.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.23.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.23.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.23.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.23.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.23.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.24.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.24.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.24.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.24.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.24.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.24.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.25.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.25.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.25.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.25.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.25.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.25.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.26.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.26.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.26.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.26.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.26.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.26.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.27.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.27.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.27.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.27.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.27.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.27.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.28.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.28.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.28.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.28.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.28.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.28.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.29.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.29.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.29.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.29.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.29.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.29.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.3.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.3.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.3.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.3.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.3.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.3.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.30.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.30.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.30.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.30.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.30.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.30.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.31.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.31.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.31.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.31.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.31.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.31.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.32.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.32.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.32.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.32.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.32.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.32.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.33.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.33.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.33.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.33.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.33.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.33.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.34.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.34.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.34.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.34.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.34.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.34.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.35.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.35.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.35.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.35.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.35.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.35.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.36.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.36.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.36.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.36.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.36.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.36.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.37.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.37.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.37.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.37.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.37.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.37.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.38.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.38.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.38.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.38.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.38.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.38.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.39.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.39.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.39.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.39.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.39.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.39.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.4.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.4.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.4.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.4.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.4.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.4.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.40.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.40.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.40.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.40.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.40.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.40.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.41.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.41.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.41.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.41.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.41.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.41.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.42.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.42.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.42.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.42.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.42.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.42.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.43.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.43.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.43.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.43.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.43.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.43.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.44.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.44.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.44.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.44.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.44.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.44.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.45.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.45.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.45.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.45.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.45.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.45.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.46.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.46.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.46.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.46.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.46.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.46.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.47.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.47.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.47.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.47.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.47.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.47.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.48.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.48.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.48.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.48.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.48.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.48.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.49.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.49.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.49.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.49.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.49.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.49.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.5.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.5.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.5.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.5.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.5.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.5.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.50.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.50.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.50.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.50.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.50.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.50.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.51.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.51.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.51.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.51.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.51.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.51.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.52.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.52.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.52.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.52.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.52.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.52.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.53.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.53.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.53.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.53.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.53.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.53.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.54.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.54.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.54.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.54.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.54.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.54.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.55.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.55.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.55.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.55.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.55.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.55.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.56.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.56.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.56.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.56.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.56.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.56.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.57.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.57.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.57.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.57.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.57.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.57.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.58.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.58.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.58.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.58.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.58.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.58.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.59.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.59.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.59.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.59.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.59.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.59.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.6.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.6.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.6.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.6.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.6.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.6.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.60.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.60.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.60.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.60.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.60.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.60.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.61.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.61.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.61.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.61.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.61.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.61.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.62.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.62.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.62.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.62.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.62.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.62.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.63.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.63.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.63.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.63.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.63.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.63.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.64.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.64.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.64.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.64.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.64.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.64.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.65.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.65.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.65.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.65.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.65.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.65.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.66.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.66.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.66.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.66.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.66.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.66.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.67.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.67.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.67.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.67.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.67.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.67.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.68.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.68.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.68.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.68.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.68.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.68.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.69.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.69.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.69.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.69.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.69.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.69.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.7.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.7.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.7.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.7.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.7.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.7.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.70.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.70.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.70.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.70.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.70.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.70.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.71.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.71.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.71.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.71.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.71.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.71.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.72.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.72.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.72.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.72.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.72.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.72.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.73.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.73.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.73.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.73.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.73.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.73.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.74.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.74.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.74.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.74.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.74.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.74.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.75.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.75.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.75.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.75.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.75.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.75.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.76.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.76.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.76.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.76.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.76.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.76.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.77.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.77.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.77.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.77.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.77.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.77.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.78.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.78.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.78.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.78.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.78.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.78.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.79.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.79.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.79.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.79.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.79.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.79.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.8.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.8.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.8.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.8.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.8.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.8.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.80.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.80.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.80.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.80.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.80.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.80.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.81.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.81.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.81.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.81.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.81.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.81.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.82.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.82.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.82.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.82.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.82.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.82.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.83.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.83.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.83.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.83.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.83.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.83.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.84.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.84.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.84.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.84.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.84.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.84.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.85.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.85.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.85.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.85.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.85.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.85.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.86.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.86.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.86.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.86.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.86.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.86.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.87.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.87.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.87.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.87.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.87.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.87.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.88.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.88.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.88.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.88.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.88.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.88.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.89.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.89.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.89.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.89.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.89.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.89.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.9.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.9.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.9.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.9.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.9.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.9.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.90.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.90.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.90.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.90.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.90.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.90.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.91.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.91.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.91.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.91.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.91.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.91.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.92.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.92.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.92.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.92.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.92.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.92.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.93.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.93.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.93.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.93.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.93.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.93.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.94.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.94.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.94.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.94.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.94.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.94.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.95.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.95.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.95.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.95.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.95.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.95.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.96.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.96.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.96.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.96.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.96.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.96.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.97.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.97.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.97.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.97.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.97.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.97.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.98.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.98.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.98.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.98.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.98.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.98.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.99.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.99.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.99.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.99.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.99.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.experts.99.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.gate.e_score_correction_bias": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.gate.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.shared_experts.down_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.shared_experts.down_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.shared_experts.gate_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.shared_experts.gate_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.shared_experts.up_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.mlp.shared_experts.up_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.post_attention_layernorm.weight": "model-00046-of-00047.safetensors", + "model.layers.45.self_attn.k_proj.bias": "model-00046-of-00047.safetensors", + "model.layers.45.self_attn.k_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.self_attn.k_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.self_attn.o_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.self_attn.o_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.self_attn.q_proj.bias": "model-00046-of-00047.safetensors", + "model.layers.45.self_attn.q_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.self_attn.q_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.45.self_attn.v_proj.bias": "model-00046-of-00047.safetensors", + "model.layers.45.self_attn.v_proj.weight": "model-00046-of-00047.safetensors", + "model.layers.45.self_attn.v_proj.weight_scale": "model-00046-of-00047.safetensors", + "model.layers.46.shared_head.head.weight": "model-00046-of-00047.safetensors", + "model.layers.46.shared_head.head.weight_scale": "model-00046-of-00047.safetensors", + "model.norm.weight": "model-00046-of-00047.safetensors", + "model.layers.46.eh_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.enorm.weight": "model-00047-of-00047.safetensors", + "model.layers.46.hnorm.weight": "model-00047-of-00047.safetensors", + "model.layers.46.input_layernorm.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.0.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.0.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.0.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.0.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.0.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.0.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.1.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.1.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.1.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.1.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.1.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.1.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.10.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.10.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.10.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.10.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.10.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.10.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.100.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.100.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.100.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.100.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.100.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.100.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.101.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.101.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.101.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.101.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.101.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.101.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.102.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.102.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.102.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.102.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.102.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.102.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.103.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.103.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.103.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.103.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.103.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.103.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.104.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.104.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.104.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.104.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.104.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.104.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.105.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.105.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.105.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.105.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.105.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.105.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.106.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.106.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.106.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.106.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.106.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.106.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.107.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.107.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.107.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.107.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.107.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.107.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.108.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.108.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.108.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.108.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.108.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.108.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.109.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.109.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.109.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.109.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.109.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.109.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.11.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.11.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.11.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.11.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.11.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.11.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.110.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.110.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.110.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.110.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.110.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.110.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.111.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.111.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.111.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.111.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.111.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.111.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.112.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.112.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.112.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.112.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.112.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.112.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.113.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.113.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.113.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.113.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.113.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.113.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.114.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.114.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.114.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.114.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.114.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.114.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.115.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.115.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.115.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.115.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.115.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.115.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.116.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.116.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.116.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.116.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.116.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.116.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.117.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.117.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.117.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.117.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.117.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.117.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.118.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.118.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.118.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.118.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.118.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.118.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.119.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.119.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.119.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.119.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.119.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.119.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.12.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.12.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.12.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.12.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.12.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.12.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.120.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.120.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.120.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.120.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.120.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.120.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.121.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.121.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.121.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.121.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.121.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.121.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.122.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.122.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.122.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.122.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.122.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.122.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.123.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.123.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.123.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.123.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.123.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.123.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.124.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.124.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.124.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.124.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.124.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.124.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.125.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.125.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.125.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.125.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.125.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.125.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.126.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.126.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.126.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.126.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.126.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.126.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.127.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.127.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.127.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.127.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.127.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.127.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.13.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.13.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.13.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.13.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.13.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.13.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.14.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.14.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.14.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.14.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.14.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.14.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.15.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.15.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.15.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.15.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.15.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.15.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.16.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.16.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.16.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.16.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.16.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.16.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.17.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.17.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.17.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.17.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.17.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.17.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.18.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.18.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.18.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.18.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.18.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.18.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.19.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.19.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.19.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.19.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.19.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.19.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.2.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.2.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.2.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.2.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.2.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.2.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.20.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.20.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.20.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.20.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.20.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.20.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.21.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.21.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.21.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.21.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.21.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.21.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.22.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.22.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.22.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.22.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.22.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.22.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.23.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.23.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.23.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.23.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.23.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.23.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.24.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.24.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.24.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.24.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.24.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.24.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.25.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.25.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.25.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.25.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.25.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.25.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.26.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.26.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.26.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.26.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.26.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.26.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.27.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.27.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.27.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.27.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.27.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.27.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.28.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.28.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.28.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.28.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.28.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.28.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.29.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.29.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.29.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.29.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.29.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.29.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.3.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.3.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.3.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.3.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.3.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.3.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.30.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.30.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.30.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.30.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.30.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.30.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.31.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.31.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.31.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.31.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.31.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.31.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.32.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.32.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.32.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.32.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.32.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.32.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.33.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.33.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.33.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.33.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.33.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.33.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.34.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.34.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.34.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.34.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.34.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.34.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.35.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.35.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.35.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.35.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.35.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.35.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.36.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.36.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.36.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.36.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.36.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.36.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.37.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.37.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.37.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.37.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.37.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.37.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.38.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.38.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.38.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.38.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.38.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.38.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.39.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.39.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.39.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.39.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.39.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.39.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.4.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.4.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.4.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.4.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.4.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.4.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.40.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.40.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.40.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.40.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.40.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.40.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.41.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.41.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.41.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.41.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.41.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.41.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.42.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.42.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.42.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.42.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.42.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.42.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.43.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.43.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.43.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.43.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.43.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.43.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.44.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.44.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.44.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.44.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.44.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.44.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.45.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.45.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.45.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.45.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.45.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.45.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.46.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.46.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.46.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.46.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.46.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.46.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.47.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.47.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.47.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.47.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.47.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.47.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.48.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.48.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.48.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.48.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.48.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.48.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.49.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.49.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.49.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.49.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.49.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.49.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.5.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.5.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.5.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.5.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.5.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.5.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.50.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.50.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.50.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.50.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.50.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.50.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.51.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.51.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.51.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.51.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.51.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.51.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.52.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.52.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.52.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.52.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.52.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.52.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.53.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.53.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.53.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.53.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.53.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.53.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.54.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.54.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.54.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.54.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.54.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.54.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.55.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.55.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.55.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.55.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.55.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.55.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.56.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.56.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.56.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.56.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.56.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.56.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.57.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.57.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.57.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.57.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.57.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.57.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.58.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.58.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.58.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.58.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.58.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.58.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.59.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.59.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.59.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.59.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.59.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.59.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.6.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.6.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.6.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.6.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.6.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.6.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.60.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.60.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.60.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.60.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.60.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.60.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.61.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.61.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.61.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.61.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.61.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.61.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.62.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.62.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.62.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.62.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.62.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.62.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.63.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.63.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.63.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.63.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.63.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.63.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.64.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.64.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.64.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.64.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.64.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.64.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.65.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.65.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.65.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.65.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.65.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.65.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.66.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.66.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.66.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.66.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.66.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.66.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.67.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.67.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.67.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.67.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.67.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.67.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.68.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.68.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.68.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.68.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.68.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.68.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.69.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.69.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.69.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.69.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.69.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.69.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.7.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.7.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.7.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.7.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.7.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.7.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.70.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.70.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.70.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.70.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.70.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.70.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.71.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.71.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.71.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.71.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.71.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.71.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.72.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.72.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.72.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.72.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.72.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.72.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.73.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.73.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.73.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.73.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.73.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.73.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.74.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.74.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.74.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.74.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.74.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.74.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.75.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.75.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.75.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.75.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.75.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.75.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.76.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.76.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.76.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.76.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.76.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.76.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.77.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.77.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.77.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.77.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.77.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.77.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.78.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.78.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.78.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.78.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.78.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.78.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.79.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.79.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.79.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.79.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.79.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.79.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.8.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.8.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.8.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.8.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.8.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.8.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.80.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.80.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.80.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.80.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.80.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.80.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.81.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.81.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.81.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.81.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.81.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.81.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.82.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.82.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.82.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.82.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.82.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.82.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.83.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.83.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.83.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.83.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.83.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.83.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.84.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.84.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.84.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.84.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.84.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.84.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.85.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.85.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.85.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.85.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.85.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.85.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.86.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.86.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.86.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.86.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.86.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.86.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.87.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.87.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.87.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.87.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.87.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.87.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.88.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.88.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.88.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.88.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.88.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.88.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.89.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.89.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.89.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.89.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.89.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.89.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.9.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.9.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.9.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.9.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.9.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.9.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.90.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.90.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.90.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.90.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.90.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.90.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.91.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.91.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.91.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.91.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.91.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.91.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.92.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.92.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.92.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.92.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.92.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.92.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.93.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.93.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.93.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.93.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.93.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.93.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.94.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.94.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.94.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.94.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.94.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.94.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.95.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.95.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.95.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.95.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.95.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.95.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.96.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.96.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.96.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.96.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.96.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.96.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.97.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.97.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.97.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.97.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.97.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.97.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.98.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.98.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.98.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.98.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.98.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.98.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.99.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.99.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.99.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.99.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.99.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.experts.99.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.gate.e_score_correction_bias": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.gate.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.shared_experts.down_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.shared_experts.down_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.shared_experts.gate_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.shared_experts.gate_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.shared_experts.up_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.mlp.shared_experts.up_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.post_attention_layernorm.weight": "model-00047-of-00047.safetensors", + "model.layers.46.self_attn.k_proj.bias": "model-00047-of-00047.safetensors", + "model.layers.46.self_attn.k_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.self_attn.k_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.self_attn.o_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.self_attn.o_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.self_attn.q_proj.bias": "model-00047-of-00047.safetensors", + "model.layers.46.self_attn.q_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.self_attn.q_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.self_attn.v_proj.bias": "model-00047-of-00047.safetensors", + "model.layers.46.self_attn.v_proj.weight": "model-00047-of-00047.safetensors", + "model.layers.46.self_attn.v_proj.weight_scale": "model-00047-of-00047.safetensors", + "model.layers.46.shared_head.norm.weight": "model-00047-of-00047.safetensors" + }, + "metadata": { + "total_size": 85665024 + } +} \ No newline at end of file diff --git a/tokenizer.json b/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..43a71efad1ab3f7e4d66d1e48e7cc44f68f21f3a --- /dev/null +++ b/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9340665016419c825c4bdabbcc9acc43b7ca2c68ce142724afa829abb1be5efd +size 19970699 diff --git a/tokenizer_config.json b/tokenizer_config.json new file mode 100644 index 0000000000000000000000000000000000000000..053f12c9b03d5acbcc921042ea0c87a6baa5d3f7 --- /dev/null +++ b/tokenizer_config.json @@ -0,0 +1,325 @@ +{ + "added_tokens_decoder": { + "151329": { + "content": "<|endoftext|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151330": { + "content": "[MASK]", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151331": { + "content": "[gMASK]", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151332": { + "content": "[sMASK]", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151333": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151334": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151335": { + "content": "<|system|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151336": { + "content": "<|user|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151337": { + "content": "<|assistant|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151338": { + "content": "<|observation|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151339": { + "content": "<|begin_of_image|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151340": { + "content": "<|end_of_image|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151341": { + "content": "<|begin_of_video|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151342": { + "content": "<|end_of_video|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151343": { + "content": "<|begin_of_audio|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151344": { + "content": "<|end_of_audio|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151345": { + "content": "<|begin_of_transcription|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151346": { + "content": "<|end_of_transcription|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151347": { + "content": "<|code_prefix|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151348": { + "content": "<|code_middle|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151349": { + "content": "<|code_suffix|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151350": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151351": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151352": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151353": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151354": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151355": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151356": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151357": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151358": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151359": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151360": { + "content": "/nothink", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "151361": { + "content": "<|begin_of_box|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151362": { + "content": "<|end_of_box|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151363": { + "content": "<|image|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + }, + "151364": { + "content": "<|video|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": false + } + }, + "additional_special_tokens": [ + "<|endoftext|>", + "[MASK]", + "[gMASK]", + "[sMASK]", + "", + "", + "<|system|>", + "<|user|>", + "<|assistant|>", + "<|observation|>", + "<|begin_of_image|>", + "<|end_of_image|>", + "<|begin_of_video|>", + "<|end_of_video|>", + "<|begin_of_audio|>", + "<|end_of_audio|>", + "<|begin_of_transcription|>", + "<|end_of_transcription|>", + "<|code_prefix|>", + "<|code_middle|>", + "<|code_suffix|>", + "/nothink" + ], + "clean_up_tokenization_spaces": false, + "do_lower_case": false, + "eos_token": "<|endoftext|>", + "extra_special_tokens": {}, + "model_max_length": 128000, + "pad_token": "<|endoftext|>", + "padding_side": "left", + "remove_space": false, + "tokenizer_class": "PreTrainedTokenizer" +}