diff --git a/-split/config.json b/-split/config.json deleted file mode 100644 index ce8dd0c6ee4ffc4dbec717046c76d806db919220..0000000000000000000000000000000000000000 --- a/-split/config.json +++ /dev/null @@ -1,27 +0,0 @@ -{ - "_name_or_path": "mistralai/Mistral-7B-Instruct-v0.3", - "architectures": [ - "MistralForCausalLM" - ], - "attention_dropout": 0.0, - "bos_token_id": 1, - "eos_token_id": 2, - "head_dim": 128, - "hidden_act": "silu", - "hidden_size": 4096, - "initializer_range": 0.02, - "intermediate_size": 14336, - "max_position_embeddings": 32768, - "model_type": "mistral", - "num_attention_heads": 32, - "num_hidden_layers": 32, - "num_key_value_heads": 8, - "rms_norm_eps": 1e-05, - "rope_theta": 1000000.0, - "sliding_window": null, - "tie_word_embeddings": false, - "torch_dtype": "float32", - "transformers_version": "4.44.0", - "use_cache": true, - "vocab_size": 32768 -} diff --git a/-split/generation_config.json b/-split/generation_config.json deleted file mode 100644 index 619b6765140cdfaa9b9d20619cae17643a28265f..0000000000000000000000000000000000000000 --- a/-split/generation_config.json +++ /dev/null @@ -1,6 +0,0 @@ -{ - "_from_model_config": true, - "bos_token_id": 1, - "eos_token_id": 2, - "transformers_version": "4.44.0" -} diff --git a/config.json b/config.json index 9f913dc05d66cfb23c16e3c93b3cc4899813dfa6..ce8dd0c6ee4ffc4dbec717046c76d806db919220 100644 --- a/config.json +++ b/config.json @@ -1,10 +1,12 @@ { + "_name_or_path": "mistralai/Mistral-7B-Instruct-v0.3", "architectures": [ "MistralForCausalLM" ], "attention_dropout": 0.0, "bos_token_id": 1, "eos_token_id": 2, + "head_dim": 128, "hidden_act": "silu", "hidden_size": 4096, "initializer_range": 0.02, @@ -18,8 +20,8 @@ "rope_theta": 1000000.0, "sliding_window": null, "tie_word_embeddings": false, - "torch_dtype": "bfloat16", - "transformers_version": "4.42.0.dev0", + "torch_dtype": "float32", + "transformers_version": "4.44.0", "use_cache": true, "vocab_size": 32768 } diff --git a/generation_config.json b/generation_config.json index b6bea2642bc3fe80f392111d52af91d1563a8de2..619b6765140cdfaa9b9d20619cae17643a28265f 100644 --- a/generation_config.json +++ b/generation_config.json @@ -2,5 +2,5 @@ "_from_model_config": true, "bos_token_id": 1, "eos_token_id": 2, - "transformers_version": "4.42.0.dev0" + "transformers_version": "4.44.0" } diff --git a/-split/pytorch_model.bin/key_to_filename.json b/pytorch_model.bin/key_to_filename.json similarity index 100% rename from -split/pytorch_model.bin/key_to_filename.json rename to pytorch_model.bin/key_to_filename.json diff --git a/-split/pytorch_model.bin/p0.model.embed_tokens.weight b/pytorch_model.bin/p0.model.embed_tokens.weight similarity index 100% rename from -split/pytorch_model.bin/p0.model.embed_tokens.weight rename to pytorch_model.bin/p0.model.embed_tokens.weight diff --git a/-split/pytorch_model.bin/p1.model.layers.0.self_attn.q_proj.weight b/pytorch_model.bin/p1.model.layers.0.self_attn.q_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p1.model.layers.0.self_attn.q_proj.weight rename to pytorch_model.bin/p1.model.layers.0.self_attn.q_proj.weight diff --git a/-split/pytorch_model.bin/p10.model.layers.1.self_attn.q_proj.weight b/pytorch_model.bin/p10.model.layers.1.self_attn.q_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p10.model.layers.1.self_attn.q_proj.weight rename to pytorch_model.bin/p10.model.layers.1.self_attn.q_proj.weight diff --git a/-split/pytorch_model.bin/p100.model.layers.11.self_attn.q_proj.weight b/pytorch_model.bin/p100.model.layers.11.self_attn.q_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p100.model.layers.11.self_attn.q_proj.weight rename to pytorch_model.bin/p100.model.layers.11.self_attn.q_proj.weight diff --git a/-split/pytorch_model.bin/p101.model.layers.11.self_attn.k_proj.weight b/pytorch_model.bin/p101.model.layers.11.self_attn.k_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p101.model.layers.11.self_attn.k_proj.weight rename to pytorch_model.bin/p101.model.layers.11.self_attn.k_proj.weight diff --git a/-split/pytorch_model.bin/p102.model.layers.11.self_attn.v_proj.weight b/pytorch_model.bin/p102.model.layers.11.self_attn.v_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p102.model.layers.11.self_attn.v_proj.weight rename to pytorch_model.bin/p102.model.layers.11.self_attn.v_proj.weight diff --git a/-split/pytorch_model.bin/p103.model.layers.11.self_attn.o_proj.weight b/pytorch_model.bin/p103.model.layers.11.self_attn.o_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p103.model.layers.11.self_attn.o_proj.weight rename to pytorch_model.bin/p103.model.layers.11.self_attn.o_proj.weight diff --git a/-split/pytorch_model.bin/p104.model.layers.11.mlp.gate_proj.weight b/pytorch_model.bin/p104.model.layers.11.mlp.gate_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p104.model.layers.11.mlp.gate_proj.weight rename to pytorch_model.bin/p104.model.layers.11.mlp.gate_proj.weight diff --git a/-split/pytorch_model.bin/p105.model.layers.11.mlp.up_proj.weight b/pytorch_model.bin/p105.model.layers.11.mlp.up_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p105.model.layers.11.mlp.up_proj.weight rename to pytorch_model.bin/p105.model.layers.11.mlp.up_proj.weight diff --git a/-split/pytorch_model.bin/p106.model.layers.11.mlp.down_proj.weight b/pytorch_model.bin/p106.model.layers.11.mlp.down_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p106.model.layers.11.mlp.down_proj.weight rename to pytorch_model.bin/p106.model.layers.11.mlp.down_proj.weight diff --git a/-split/pytorch_model.bin/p107.model.layers.11.input_layernorm.weight b/pytorch_model.bin/p107.model.layers.11.input_layernorm.weight similarity index 100% rename from -split/pytorch_model.bin/p107.model.layers.11.input_layernorm.weight rename to pytorch_model.bin/p107.model.layers.11.input_layernorm.weight diff --git a/-split/pytorch_model.bin/p108.model.layers.11.post_attention_layernorm.weight b/pytorch_model.bin/p108.model.layers.11.post_attention_layernorm.weight similarity index 100% rename from -split/pytorch_model.bin/p108.model.layers.11.post_attention_layernorm.weight rename to pytorch_model.bin/p108.model.layers.11.post_attention_layernorm.weight diff --git a/-split/pytorch_model.bin/p109.model.layers.12.self_attn.q_proj.weight b/pytorch_model.bin/p109.model.layers.12.self_attn.q_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p109.model.layers.12.self_attn.q_proj.weight rename to pytorch_model.bin/p109.model.layers.12.self_attn.q_proj.weight diff --git a/-split/pytorch_model.bin/p11.model.layers.1.self_attn.k_proj.weight b/pytorch_model.bin/p11.model.layers.1.self_attn.k_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p11.model.layers.1.self_attn.k_proj.weight rename to pytorch_model.bin/p11.model.layers.1.self_attn.k_proj.weight diff --git a/-split/pytorch_model.bin/p110.model.layers.12.self_attn.k_proj.weight b/pytorch_model.bin/p110.model.layers.12.self_attn.k_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p110.model.layers.12.self_attn.k_proj.weight rename to pytorch_model.bin/p110.model.layers.12.self_attn.k_proj.weight diff --git a/-split/pytorch_model.bin/p111.model.layers.12.self_attn.v_proj.weight b/pytorch_model.bin/p111.model.layers.12.self_attn.v_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p111.model.layers.12.self_attn.v_proj.weight rename to pytorch_model.bin/p111.model.layers.12.self_attn.v_proj.weight diff --git a/-split/pytorch_model.bin/p112.model.layers.12.self_attn.o_proj.weight b/pytorch_model.bin/p112.model.layers.12.self_attn.o_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p112.model.layers.12.self_attn.o_proj.weight rename to pytorch_model.bin/p112.model.layers.12.self_attn.o_proj.weight diff --git a/-split/pytorch_model.bin/p113.model.layers.12.mlp.gate_proj.weight b/pytorch_model.bin/p113.model.layers.12.mlp.gate_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p113.model.layers.12.mlp.gate_proj.weight rename to pytorch_model.bin/p113.model.layers.12.mlp.gate_proj.weight diff --git a/-split/pytorch_model.bin/p114.model.layers.12.mlp.up_proj.weight b/pytorch_model.bin/p114.model.layers.12.mlp.up_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p114.model.layers.12.mlp.up_proj.weight rename to pytorch_model.bin/p114.model.layers.12.mlp.up_proj.weight diff --git a/-split/pytorch_model.bin/p115.model.layers.12.mlp.down_proj.weight b/pytorch_model.bin/p115.model.layers.12.mlp.down_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p115.model.layers.12.mlp.down_proj.weight rename to pytorch_model.bin/p115.model.layers.12.mlp.down_proj.weight diff --git a/-split/pytorch_model.bin/p116.model.layers.12.input_layernorm.weight b/pytorch_model.bin/p116.model.layers.12.input_layernorm.weight similarity index 100% rename from -split/pytorch_model.bin/p116.model.layers.12.input_layernorm.weight rename to pytorch_model.bin/p116.model.layers.12.input_layernorm.weight diff --git a/-split/pytorch_model.bin/p117.model.layers.12.post_attention_layernorm.weight b/pytorch_model.bin/p117.model.layers.12.post_attention_layernorm.weight similarity index 100% rename from -split/pytorch_model.bin/p117.model.layers.12.post_attention_layernorm.weight rename to pytorch_model.bin/p117.model.layers.12.post_attention_layernorm.weight diff --git a/-split/pytorch_model.bin/p118.model.layers.13.self_attn.q_proj.weight b/pytorch_model.bin/p118.model.layers.13.self_attn.q_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p118.model.layers.13.self_attn.q_proj.weight rename to pytorch_model.bin/p118.model.layers.13.self_attn.q_proj.weight diff --git a/-split/pytorch_model.bin/p119.model.layers.13.self_attn.k_proj.weight b/pytorch_model.bin/p119.model.layers.13.self_attn.k_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p119.model.layers.13.self_attn.k_proj.weight rename to pytorch_model.bin/p119.model.layers.13.self_attn.k_proj.weight diff --git a/-split/pytorch_model.bin/p12.model.layers.1.self_attn.v_proj.weight b/pytorch_model.bin/p12.model.layers.1.self_attn.v_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p12.model.layers.1.self_attn.v_proj.weight rename to pytorch_model.bin/p12.model.layers.1.self_attn.v_proj.weight diff --git a/-split/pytorch_model.bin/p120.model.layers.13.self_attn.v_proj.weight b/pytorch_model.bin/p120.model.layers.13.self_attn.v_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p120.model.layers.13.self_attn.v_proj.weight rename to pytorch_model.bin/p120.model.layers.13.self_attn.v_proj.weight diff --git a/-split/pytorch_model.bin/p121.model.layers.13.self_attn.o_proj.weight b/pytorch_model.bin/p121.model.layers.13.self_attn.o_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p121.model.layers.13.self_attn.o_proj.weight rename to pytorch_model.bin/p121.model.layers.13.self_attn.o_proj.weight diff --git a/-split/pytorch_model.bin/p122.model.layers.13.mlp.gate_proj.weight b/pytorch_model.bin/p122.model.layers.13.mlp.gate_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p122.model.layers.13.mlp.gate_proj.weight rename to pytorch_model.bin/p122.model.layers.13.mlp.gate_proj.weight diff --git a/-split/pytorch_model.bin/p123.model.layers.13.mlp.up_proj.weight b/pytorch_model.bin/p123.model.layers.13.mlp.up_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p123.model.layers.13.mlp.up_proj.weight rename to pytorch_model.bin/p123.model.layers.13.mlp.up_proj.weight diff --git a/-split/pytorch_model.bin/p124.model.layers.13.mlp.down_proj.weight b/pytorch_model.bin/p124.model.layers.13.mlp.down_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p124.model.layers.13.mlp.down_proj.weight rename to pytorch_model.bin/p124.model.layers.13.mlp.down_proj.weight diff --git a/-split/pytorch_model.bin/p125.model.layers.13.input_layernorm.weight b/pytorch_model.bin/p125.model.layers.13.input_layernorm.weight similarity index 100% rename from -split/pytorch_model.bin/p125.model.layers.13.input_layernorm.weight rename to pytorch_model.bin/p125.model.layers.13.input_layernorm.weight diff --git a/-split/pytorch_model.bin/p126.model.layers.13.post_attention_layernorm.weight b/pytorch_model.bin/p126.model.layers.13.post_attention_layernorm.weight similarity index 100% rename from -split/pytorch_model.bin/p126.model.layers.13.post_attention_layernorm.weight rename to pytorch_model.bin/p126.model.layers.13.post_attention_layernorm.weight diff --git a/-split/pytorch_model.bin/p127.model.layers.14.self_attn.q_proj.weight b/pytorch_model.bin/p127.model.layers.14.self_attn.q_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p127.model.layers.14.self_attn.q_proj.weight rename to pytorch_model.bin/p127.model.layers.14.self_attn.q_proj.weight diff --git a/-split/pytorch_model.bin/p128.model.layers.14.self_attn.k_proj.weight b/pytorch_model.bin/p128.model.layers.14.self_attn.k_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p128.model.layers.14.self_attn.k_proj.weight rename to pytorch_model.bin/p128.model.layers.14.self_attn.k_proj.weight diff --git a/-split/pytorch_model.bin/p129.model.layers.14.self_attn.v_proj.weight b/pytorch_model.bin/p129.model.layers.14.self_attn.v_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p129.model.layers.14.self_attn.v_proj.weight rename to pytorch_model.bin/p129.model.layers.14.self_attn.v_proj.weight diff --git a/-split/pytorch_model.bin/p13.model.layers.1.self_attn.o_proj.weight b/pytorch_model.bin/p13.model.layers.1.self_attn.o_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p13.model.layers.1.self_attn.o_proj.weight rename to pytorch_model.bin/p13.model.layers.1.self_attn.o_proj.weight diff --git a/-split/pytorch_model.bin/p130.model.layers.14.self_attn.o_proj.weight b/pytorch_model.bin/p130.model.layers.14.self_attn.o_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p130.model.layers.14.self_attn.o_proj.weight rename to pytorch_model.bin/p130.model.layers.14.self_attn.o_proj.weight diff --git a/-split/pytorch_model.bin/p131.model.layers.14.mlp.gate_proj.weight b/pytorch_model.bin/p131.model.layers.14.mlp.gate_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p131.model.layers.14.mlp.gate_proj.weight rename to pytorch_model.bin/p131.model.layers.14.mlp.gate_proj.weight diff --git a/-split/pytorch_model.bin/p132.model.layers.14.mlp.up_proj.weight b/pytorch_model.bin/p132.model.layers.14.mlp.up_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p132.model.layers.14.mlp.up_proj.weight rename to pytorch_model.bin/p132.model.layers.14.mlp.up_proj.weight diff --git a/-split/pytorch_model.bin/p133.model.layers.14.mlp.down_proj.weight b/pytorch_model.bin/p133.model.layers.14.mlp.down_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p133.model.layers.14.mlp.down_proj.weight rename to pytorch_model.bin/p133.model.layers.14.mlp.down_proj.weight diff --git a/-split/pytorch_model.bin/p134.model.layers.14.input_layernorm.weight b/pytorch_model.bin/p134.model.layers.14.input_layernorm.weight similarity index 100% rename from -split/pytorch_model.bin/p134.model.layers.14.input_layernorm.weight rename to pytorch_model.bin/p134.model.layers.14.input_layernorm.weight diff --git a/-split/pytorch_model.bin/p135.model.layers.14.post_attention_layernorm.weight b/pytorch_model.bin/p135.model.layers.14.post_attention_layernorm.weight similarity index 100% rename from -split/pytorch_model.bin/p135.model.layers.14.post_attention_layernorm.weight rename to pytorch_model.bin/p135.model.layers.14.post_attention_layernorm.weight diff --git a/-split/pytorch_model.bin/p136.model.layers.15.self_attn.q_proj.weight b/pytorch_model.bin/p136.model.layers.15.self_attn.q_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p136.model.layers.15.self_attn.q_proj.weight rename to pytorch_model.bin/p136.model.layers.15.self_attn.q_proj.weight diff --git a/-split/pytorch_model.bin/p137.model.layers.15.self_attn.k_proj.weight b/pytorch_model.bin/p137.model.layers.15.self_attn.k_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p137.model.layers.15.self_attn.k_proj.weight rename to pytorch_model.bin/p137.model.layers.15.self_attn.k_proj.weight diff --git a/-split/pytorch_model.bin/p138.model.layers.15.self_attn.v_proj.weight b/pytorch_model.bin/p138.model.layers.15.self_attn.v_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p138.model.layers.15.self_attn.v_proj.weight rename to pytorch_model.bin/p138.model.layers.15.self_attn.v_proj.weight diff --git a/-split/pytorch_model.bin/p139.model.layers.15.self_attn.o_proj.weight b/pytorch_model.bin/p139.model.layers.15.self_attn.o_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p139.model.layers.15.self_attn.o_proj.weight rename to pytorch_model.bin/p139.model.layers.15.self_attn.o_proj.weight diff --git a/-split/pytorch_model.bin/p14.model.layers.1.mlp.gate_proj.weight b/pytorch_model.bin/p14.model.layers.1.mlp.gate_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p14.model.layers.1.mlp.gate_proj.weight rename to pytorch_model.bin/p14.model.layers.1.mlp.gate_proj.weight diff --git a/-split/pytorch_model.bin/p140.model.layers.15.mlp.gate_proj.weight b/pytorch_model.bin/p140.model.layers.15.mlp.gate_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p140.model.layers.15.mlp.gate_proj.weight rename to pytorch_model.bin/p140.model.layers.15.mlp.gate_proj.weight diff --git a/-split/pytorch_model.bin/p141.model.layers.15.mlp.up_proj.weight b/pytorch_model.bin/p141.model.layers.15.mlp.up_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p141.model.layers.15.mlp.up_proj.weight rename to pytorch_model.bin/p141.model.layers.15.mlp.up_proj.weight diff --git a/-split/pytorch_model.bin/p142.model.layers.15.mlp.down_proj.weight b/pytorch_model.bin/p142.model.layers.15.mlp.down_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p142.model.layers.15.mlp.down_proj.weight rename to pytorch_model.bin/p142.model.layers.15.mlp.down_proj.weight diff --git a/-split/pytorch_model.bin/p143.model.layers.15.input_layernorm.weight b/pytorch_model.bin/p143.model.layers.15.input_layernorm.weight similarity index 100% rename from -split/pytorch_model.bin/p143.model.layers.15.input_layernorm.weight rename to pytorch_model.bin/p143.model.layers.15.input_layernorm.weight diff --git a/-split/pytorch_model.bin/p144.model.layers.15.post_attention_layernorm.weight b/pytorch_model.bin/p144.model.layers.15.post_attention_layernorm.weight similarity index 100% rename from -split/pytorch_model.bin/p144.model.layers.15.post_attention_layernorm.weight rename to pytorch_model.bin/p144.model.layers.15.post_attention_layernorm.weight diff --git a/-split/pytorch_model.bin/p145.model.layers.16.self_attn.q_proj.weight b/pytorch_model.bin/p145.model.layers.16.self_attn.q_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p145.model.layers.16.self_attn.q_proj.weight rename to pytorch_model.bin/p145.model.layers.16.self_attn.q_proj.weight diff --git a/-split/pytorch_model.bin/p146.model.layers.16.self_attn.k_proj.weight b/pytorch_model.bin/p146.model.layers.16.self_attn.k_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p146.model.layers.16.self_attn.k_proj.weight rename to pytorch_model.bin/p146.model.layers.16.self_attn.k_proj.weight diff --git a/-split/pytorch_model.bin/p147.model.layers.16.self_attn.v_proj.weight b/pytorch_model.bin/p147.model.layers.16.self_attn.v_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p147.model.layers.16.self_attn.v_proj.weight rename to pytorch_model.bin/p147.model.layers.16.self_attn.v_proj.weight diff --git a/-split/pytorch_model.bin/p148.model.layers.16.self_attn.o_proj.weight b/pytorch_model.bin/p148.model.layers.16.self_attn.o_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p148.model.layers.16.self_attn.o_proj.weight rename to pytorch_model.bin/p148.model.layers.16.self_attn.o_proj.weight diff --git a/-split/pytorch_model.bin/p149.model.layers.16.mlp.gate_proj.weight b/pytorch_model.bin/p149.model.layers.16.mlp.gate_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p149.model.layers.16.mlp.gate_proj.weight rename to pytorch_model.bin/p149.model.layers.16.mlp.gate_proj.weight diff --git a/-split/pytorch_model.bin/p15.model.layers.1.mlp.up_proj.weight b/pytorch_model.bin/p15.model.layers.1.mlp.up_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p15.model.layers.1.mlp.up_proj.weight rename to pytorch_model.bin/p15.model.layers.1.mlp.up_proj.weight diff --git a/-split/pytorch_model.bin/p150.model.layers.16.mlp.up_proj.weight b/pytorch_model.bin/p150.model.layers.16.mlp.up_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p150.model.layers.16.mlp.up_proj.weight rename to pytorch_model.bin/p150.model.layers.16.mlp.up_proj.weight diff --git a/-split/pytorch_model.bin/p151.model.layers.16.mlp.down_proj.weight b/pytorch_model.bin/p151.model.layers.16.mlp.down_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p151.model.layers.16.mlp.down_proj.weight rename to pytorch_model.bin/p151.model.layers.16.mlp.down_proj.weight diff --git a/-split/pytorch_model.bin/p152.model.layers.16.input_layernorm.weight b/pytorch_model.bin/p152.model.layers.16.input_layernorm.weight similarity index 100% rename from -split/pytorch_model.bin/p152.model.layers.16.input_layernorm.weight rename to pytorch_model.bin/p152.model.layers.16.input_layernorm.weight diff --git a/-split/pytorch_model.bin/p153.model.layers.16.post_attention_layernorm.weight b/pytorch_model.bin/p153.model.layers.16.post_attention_layernorm.weight similarity index 100% rename from -split/pytorch_model.bin/p153.model.layers.16.post_attention_layernorm.weight rename to pytorch_model.bin/p153.model.layers.16.post_attention_layernorm.weight diff --git a/-split/pytorch_model.bin/p154.model.layers.17.self_attn.q_proj.weight b/pytorch_model.bin/p154.model.layers.17.self_attn.q_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p154.model.layers.17.self_attn.q_proj.weight rename to pytorch_model.bin/p154.model.layers.17.self_attn.q_proj.weight diff --git a/-split/pytorch_model.bin/p155.model.layers.17.self_attn.k_proj.weight b/pytorch_model.bin/p155.model.layers.17.self_attn.k_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p155.model.layers.17.self_attn.k_proj.weight rename to pytorch_model.bin/p155.model.layers.17.self_attn.k_proj.weight diff --git a/-split/pytorch_model.bin/p156.model.layers.17.self_attn.v_proj.weight b/pytorch_model.bin/p156.model.layers.17.self_attn.v_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p156.model.layers.17.self_attn.v_proj.weight rename to pytorch_model.bin/p156.model.layers.17.self_attn.v_proj.weight diff --git a/-split/pytorch_model.bin/p157.model.layers.17.self_attn.o_proj.weight b/pytorch_model.bin/p157.model.layers.17.self_attn.o_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p157.model.layers.17.self_attn.o_proj.weight rename to pytorch_model.bin/p157.model.layers.17.self_attn.o_proj.weight diff --git a/-split/pytorch_model.bin/p158.model.layers.17.mlp.gate_proj.weight b/pytorch_model.bin/p158.model.layers.17.mlp.gate_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p158.model.layers.17.mlp.gate_proj.weight rename to pytorch_model.bin/p158.model.layers.17.mlp.gate_proj.weight diff --git a/-split/pytorch_model.bin/p159.model.layers.17.mlp.up_proj.weight b/pytorch_model.bin/p159.model.layers.17.mlp.up_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p159.model.layers.17.mlp.up_proj.weight rename to pytorch_model.bin/p159.model.layers.17.mlp.up_proj.weight diff --git a/-split/pytorch_model.bin/p16.model.layers.1.mlp.down_proj.weight b/pytorch_model.bin/p16.model.layers.1.mlp.down_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p16.model.layers.1.mlp.down_proj.weight rename to pytorch_model.bin/p16.model.layers.1.mlp.down_proj.weight diff --git a/-split/pytorch_model.bin/p160.model.layers.17.mlp.down_proj.weight b/pytorch_model.bin/p160.model.layers.17.mlp.down_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p160.model.layers.17.mlp.down_proj.weight rename to pytorch_model.bin/p160.model.layers.17.mlp.down_proj.weight diff --git a/-split/pytorch_model.bin/p161.model.layers.17.input_layernorm.weight b/pytorch_model.bin/p161.model.layers.17.input_layernorm.weight similarity index 100% rename from -split/pytorch_model.bin/p161.model.layers.17.input_layernorm.weight rename to pytorch_model.bin/p161.model.layers.17.input_layernorm.weight diff --git a/-split/pytorch_model.bin/p162.model.layers.17.post_attention_layernorm.weight b/pytorch_model.bin/p162.model.layers.17.post_attention_layernorm.weight similarity index 100% rename from -split/pytorch_model.bin/p162.model.layers.17.post_attention_layernorm.weight rename to pytorch_model.bin/p162.model.layers.17.post_attention_layernorm.weight diff --git a/-split/pytorch_model.bin/p163.model.layers.18.self_attn.q_proj.weight b/pytorch_model.bin/p163.model.layers.18.self_attn.q_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p163.model.layers.18.self_attn.q_proj.weight rename to pytorch_model.bin/p163.model.layers.18.self_attn.q_proj.weight diff --git a/-split/pytorch_model.bin/p164.model.layers.18.self_attn.k_proj.weight b/pytorch_model.bin/p164.model.layers.18.self_attn.k_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p164.model.layers.18.self_attn.k_proj.weight rename to pytorch_model.bin/p164.model.layers.18.self_attn.k_proj.weight diff --git a/-split/pytorch_model.bin/p165.model.layers.18.self_attn.v_proj.weight b/pytorch_model.bin/p165.model.layers.18.self_attn.v_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p165.model.layers.18.self_attn.v_proj.weight rename to pytorch_model.bin/p165.model.layers.18.self_attn.v_proj.weight diff --git a/-split/pytorch_model.bin/p166.model.layers.18.self_attn.o_proj.weight b/pytorch_model.bin/p166.model.layers.18.self_attn.o_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p166.model.layers.18.self_attn.o_proj.weight rename to pytorch_model.bin/p166.model.layers.18.self_attn.o_proj.weight diff --git a/-split/pytorch_model.bin/p167.model.layers.18.mlp.gate_proj.weight b/pytorch_model.bin/p167.model.layers.18.mlp.gate_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p167.model.layers.18.mlp.gate_proj.weight rename to pytorch_model.bin/p167.model.layers.18.mlp.gate_proj.weight diff --git a/-split/pytorch_model.bin/p168.model.layers.18.mlp.up_proj.weight b/pytorch_model.bin/p168.model.layers.18.mlp.up_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p168.model.layers.18.mlp.up_proj.weight rename to pytorch_model.bin/p168.model.layers.18.mlp.up_proj.weight diff --git a/-split/pytorch_model.bin/p169.model.layers.18.mlp.down_proj.weight b/pytorch_model.bin/p169.model.layers.18.mlp.down_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p169.model.layers.18.mlp.down_proj.weight rename to pytorch_model.bin/p169.model.layers.18.mlp.down_proj.weight diff --git a/-split/pytorch_model.bin/p17.model.layers.1.input_layernorm.weight b/pytorch_model.bin/p17.model.layers.1.input_layernorm.weight similarity index 100% rename from -split/pytorch_model.bin/p17.model.layers.1.input_layernorm.weight rename to pytorch_model.bin/p17.model.layers.1.input_layernorm.weight diff --git a/-split/pytorch_model.bin/p170.model.layers.18.input_layernorm.weight b/pytorch_model.bin/p170.model.layers.18.input_layernorm.weight similarity index 100% rename from -split/pytorch_model.bin/p170.model.layers.18.input_layernorm.weight rename to pytorch_model.bin/p170.model.layers.18.input_layernorm.weight diff --git a/-split/pytorch_model.bin/p171.model.layers.18.post_attention_layernorm.weight b/pytorch_model.bin/p171.model.layers.18.post_attention_layernorm.weight similarity index 100% rename from -split/pytorch_model.bin/p171.model.layers.18.post_attention_layernorm.weight rename to pytorch_model.bin/p171.model.layers.18.post_attention_layernorm.weight diff --git a/-split/pytorch_model.bin/p172.model.layers.19.self_attn.q_proj.weight b/pytorch_model.bin/p172.model.layers.19.self_attn.q_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p172.model.layers.19.self_attn.q_proj.weight rename to pytorch_model.bin/p172.model.layers.19.self_attn.q_proj.weight diff --git a/-split/pytorch_model.bin/p173.model.layers.19.self_attn.k_proj.weight b/pytorch_model.bin/p173.model.layers.19.self_attn.k_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p173.model.layers.19.self_attn.k_proj.weight rename to pytorch_model.bin/p173.model.layers.19.self_attn.k_proj.weight diff --git a/-split/pytorch_model.bin/p174.model.layers.19.self_attn.v_proj.weight b/pytorch_model.bin/p174.model.layers.19.self_attn.v_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p174.model.layers.19.self_attn.v_proj.weight rename to pytorch_model.bin/p174.model.layers.19.self_attn.v_proj.weight diff --git a/-split/pytorch_model.bin/p175.model.layers.19.self_attn.o_proj.weight b/pytorch_model.bin/p175.model.layers.19.self_attn.o_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p175.model.layers.19.self_attn.o_proj.weight rename to pytorch_model.bin/p175.model.layers.19.self_attn.o_proj.weight diff --git a/-split/pytorch_model.bin/p176.model.layers.19.mlp.gate_proj.weight b/pytorch_model.bin/p176.model.layers.19.mlp.gate_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p176.model.layers.19.mlp.gate_proj.weight rename to pytorch_model.bin/p176.model.layers.19.mlp.gate_proj.weight diff --git a/-split/pytorch_model.bin/p177.model.layers.19.mlp.up_proj.weight b/pytorch_model.bin/p177.model.layers.19.mlp.up_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p177.model.layers.19.mlp.up_proj.weight rename to pytorch_model.bin/p177.model.layers.19.mlp.up_proj.weight diff --git a/-split/pytorch_model.bin/p178.model.layers.19.mlp.down_proj.weight b/pytorch_model.bin/p178.model.layers.19.mlp.down_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p178.model.layers.19.mlp.down_proj.weight rename to pytorch_model.bin/p178.model.layers.19.mlp.down_proj.weight diff --git a/-split/pytorch_model.bin/p179.model.layers.19.input_layernorm.weight b/pytorch_model.bin/p179.model.layers.19.input_layernorm.weight similarity index 100% rename from -split/pytorch_model.bin/p179.model.layers.19.input_layernorm.weight rename to pytorch_model.bin/p179.model.layers.19.input_layernorm.weight diff --git a/-split/pytorch_model.bin/p18.model.layers.1.post_attention_layernorm.weight b/pytorch_model.bin/p18.model.layers.1.post_attention_layernorm.weight similarity index 100% rename from -split/pytorch_model.bin/p18.model.layers.1.post_attention_layernorm.weight rename to pytorch_model.bin/p18.model.layers.1.post_attention_layernorm.weight diff --git a/-split/pytorch_model.bin/p180.model.layers.19.post_attention_layernorm.weight b/pytorch_model.bin/p180.model.layers.19.post_attention_layernorm.weight similarity index 100% rename from -split/pytorch_model.bin/p180.model.layers.19.post_attention_layernorm.weight rename to pytorch_model.bin/p180.model.layers.19.post_attention_layernorm.weight diff --git a/-split/pytorch_model.bin/p181.model.layers.20.self_attn.q_proj.weight b/pytorch_model.bin/p181.model.layers.20.self_attn.q_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p181.model.layers.20.self_attn.q_proj.weight rename to pytorch_model.bin/p181.model.layers.20.self_attn.q_proj.weight diff --git a/-split/pytorch_model.bin/p182.model.layers.20.self_attn.k_proj.weight b/pytorch_model.bin/p182.model.layers.20.self_attn.k_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p182.model.layers.20.self_attn.k_proj.weight rename to pytorch_model.bin/p182.model.layers.20.self_attn.k_proj.weight diff --git a/-split/pytorch_model.bin/p183.model.layers.20.self_attn.v_proj.weight b/pytorch_model.bin/p183.model.layers.20.self_attn.v_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p183.model.layers.20.self_attn.v_proj.weight rename to pytorch_model.bin/p183.model.layers.20.self_attn.v_proj.weight diff --git a/-split/pytorch_model.bin/p184.model.layers.20.self_attn.o_proj.weight b/pytorch_model.bin/p184.model.layers.20.self_attn.o_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p184.model.layers.20.self_attn.o_proj.weight rename to pytorch_model.bin/p184.model.layers.20.self_attn.o_proj.weight diff --git a/-split/pytorch_model.bin/p185.model.layers.20.mlp.gate_proj.weight b/pytorch_model.bin/p185.model.layers.20.mlp.gate_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p185.model.layers.20.mlp.gate_proj.weight rename to pytorch_model.bin/p185.model.layers.20.mlp.gate_proj.weight diff --git a/-split/pytorch_model.bin/p186.model.layers.20.mlp.up_proj.weight b/pytorch_model.bin/p186.model.layers.20.mlp.up_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p186.model.layers.20.mlp.up_proj.weight rename to pytorch_model.bin/p186.model.layers.20.mlp.up_proj.weight diff --git a/-split/pytorch_model.bin/p187.model.layers.20.mlp.down_proj.weight b/pytorch_model.bin/p187.model.layers.20.mlp.down_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p187.model.layers.20.mlp.down_proj.weight rename to pytorch_model.bin/p187.model.layers.20.mlp.down_proj.weight diff --git a/-split/pytorch_model.bin/p188.model.layers.20.input_layernorm.weight b/pytorch_model.bin/p188.model.layers.20.input_layernorm.weight similarity index 100% rename from -split/pytorch_model.bin/p188.model.layers.20.input_layernorm.weight rename to pytorch_model.bin/p188.model.layers.20.input_layernorm.weight diff --git a/-split/pytorch_model.bin/p189.model.layers.20.post_attention_layernorm.weight b/pytorch_model.bin/p189.model.layers.20.post_attention_layernorm.weight similarity index 100% rename from -split/pytorch_model.bin/p189.model.layers.20.post_attention_layernorm.weight rename to pytorch_model.bin/p189.model.layers.20.post_attention_layernorm.weight diff --git a/-split/pytorch_model.bin/p19.model.layers.2.self_attn.q_proj.weight b/pytorch_model.bin/p19.model.layers.2.self_attn.q_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p19.model.layers.2.self_attn.q_proj.weight rename to pytorch_model.bin/p19.model.layers.2.self_attn.q_proj.weight diff --git a/-split/pytorch_model.bin/p190.model.layers.21.self_attn.q_proj.weight b/pytorch_model.bin/p190.model.layers.21.self_attn.q_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p190.model.layers.21.self_attn.q_proj.weight rename to pytorch_model.bin/p190.model.layers.21.self_attn.q_proj.weight diff --git a/-split/pytorch_model.bin/p191.model.layers.21.self_attn.k_proj.weight b/pytorch_model.bin/p191.model.layers.21.self_attn.k_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p191.model.layers.21.self_attn.k_proj.weight rename to pytorch_model.bin/p191.model.layers.21.self_attn.k_proj.weight diff --git a/-split/pytorch_model.bin/p192.model.layers.21.self_attn.v_proj.weight b/pytorch_model.bin/p192.model.layers.21.self_attn.v_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p192.model.layers.21.self_attn.v_proj.weight rename to pytorch_model.bin/p192.model.layers.21.self_attn.v_proj.weight diff --git a/-split/pytorch_model.bin/p193.model.layers.21.self_attn.o_proj.weight b/pytorch_model.bin/p193.model.layers.21.self_attn.o_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p193.model.layers.21.self_attn.o_proj.weight rename to pytorch_model.bin/p193.model.layers.21.self_attn.o_proj.weight diff --git a/-split/pytorch_model.bin/p194.model.layers.21.mlp.gate_proj.weight b/pytorch_model.bin/p194.model.layers.21.mlp.gate_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p194.model.layers.21.mlp.gate_proj.weight rename to pytorch_model.bin/p194.model.layers.21.mlp.gate_proj.weight diff --git a/-split/pytorch_model.bin/p195.model.layers.21.mlp.up_proj.weight b/pytorch_model.bin/p195.model.layers.21.mlp.up_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p195.model.layers.21.mlp.up_proj.weight rename to pytorch_model.bin/p195.model.layers.21.mlp.up_proj.weight diff --git a/-split/pytorch_model.bin/p196.model.layers.21.mlp.down_proj.weight b/pytorch_model.bin/p196.model.layers.21.mlp.down_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p196.model.layers.21.mlp.down_proj.weight rename to pytorch_model.bin/p196.model.layers.21.mlp.down_proj.weight diff --git a/-split/pytorch_model.bin/p197.model.layers.21.input_layernorm.weight b/pytorch_model.bin/p197.model.layers.21.input_layernorm.weight similarity index 100% rename from -split/pytorch_model.bin/p197.model.layers.21.input_layernorm.weight rename to pytorch_model.bin/p197.model.layers.21.input_layernorm.weight diff --git a/-split/pytorch_model.bin/p198.model.layers.21.post_attention_layernorm.weight b/pytorch_model.bin/p198.model.layers.21.post_attention_layernorm.weight similarity index 100% rename from -split/pytorch_model.bin/p198.model.layers.21.post_attention_layernorm.weight rename to pytorch_model.bin/p198.model.layers.21.post_attention_layernorm.weight diff --git a/-split/pytorch_model.bin/p199.model.layers.22.self_attn.q_proj.weight b/pytorch_model.bin/p199.model.layers.22.self_attn.q_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p199.model.layers.22.self_attn.q_proj.weight rename to pytorch_model.bin/p199.model.layers.22.self_attn.q_proj.weight diff --git a/-split/pytorch_model.bin/p2.model.layers.0.self_attn.k_proj.weight b/pytorch_model.bin/p2.model.layers.0.self_attn.k_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p2.model.layers.0.self_attn.k_proj.weight rename to pytorch_model.bin/p2.model.layers.0.self_attn.k_proj.weight diff --git a/-split/pytorch_model.bin/p20.model.layers.2.self_attn.k_proj.weight b/pytorch_model.bin/p20.model.layers.2.self_attn.k_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p20.model.layers.2.self_attn.k_proj.weight rename to pytorch_model.bin/p20.model.layers.2.self_attn.k_proj.weight diff --git a/-split/pytorch_model.bin/p200.model.layers.22.self_attn.k_proj.weight b/pytorch_model.bin/p200.model.layers.22.self_attn.k_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p200.model.layers.22.self_attn.k_proj.weight rename to pytorch_model.bin/p200.model.layers.22.self_attn.k_proj.weight diff --git a/-split/pytorch_model.bin/p201.model.layers.22.self_attn.v_proj.weight b/pytorch_model.bin/p201.model.layers.22.self_attn.v_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p201.model.layers.22.self_attn.v_proj.weight rename to pytorch_model.bin/p201.model.layers.22.self_attn.v_proj.weight diff --git a/-split/pytorch_model.bin/p202.model.layers.22.self_attn.o_proj.weight b/pytorch_model.bin/p202.model.layers.22.self_attn.o_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p202.model.layers.22.self_attn.o_proj.weight rename to pytorch_model.bin/p202.model.layers.22.self_attn.o_proj.weight diff --git a/-split/pytorch_model.bin/p203.model.layers.22.mlp.gate_proj.weight b/pytorch_model.bin/p203.model.layers.22.mlp.gate_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p203.model.layers.22.mlp.gate_proj.weight rename to pytorch_model.bin/p203.model.layers.22.mlp.gate_proj.weight diff --git a/-split/pytorch_model.bin/p204.model.layers.22.mlp.up_proj.weight b/pytorch_model.bin/p204.model.layers.22.mlp.up_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p204.model.layers.22.mlp.up_proj.weight rename to pytorch_model.bin/p204.model.layers.22.mlp.up_proj.weight diff --git a/-split/pytorch_model.bin/p205.model.layers.22.mlp.down_proj.weight b/pytorch_model.bin/p205.model.layers.22.mlp.down_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p205.model.layers.22.mlp.down_proj.weight rename to pytorch_model.bin/p205.model.layers.22.mlp.down_proj.weight diff --git a/-split/pytorch_model.bin/p206.model.layers.22.input_layernorm.weight b/pytorch_model.bin/p206.model.layers.22.input_layernorm.weight similarity index 100% rename from -split/pytorch_model.bin/p206.model.layers.22.input_layernorm.weight rename to pytorch_model.bin/p206.model.layers.22.input_layernorm.weight diff --git a/-split/pytorch_model.bin/p207.model.layers.22.post_attention_layernorm.weight b/pytorch_model.bin/p207.model.layers.22.post_attention_layernorm.weight similarity index 100% rename from -split/pytorch_model.bin/p207.model.layers.22.post_attention_layernorm.weight rename to pytorch_model.bin/p207.model.layers.22.post_attention_layernorm.weight diff --git a/-split/pytorch_model.bin/p208.model.layers.23.self_attn.q_proj.weight b/pytorch_model.bin/p208.model.layers.23.self_attn.q_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p208.model.layers.23.self_attn.q_proj.weight rename to pytorch_model.bin/p208.model.layers.23.self_attn.q_proj.weight diff --git a/-split/pytorch_model.bin/p209.model.layers.23.self_attn.k_proj.weight b/pytorch_model.bin/p209.model.layers.23.self_attn.k_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p209.model.layers.23.self_attn.k_proj.weight rename to pytorch_model.bin/p209.model.layers.23.self_attn.k_proj.weight diff --git a/-split/pytorch_model.bin/p21.model.layers.2.self_attn.v_proj.weight b/pytorch_model.bin/p21.model.layers.2.self_attn.v_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p21.model.layers.2.self_attn.v_proj.weight rename to pytorch_model.bin/p21.model.layers.2.self_attn.v_proj.weight diff --git a/-split/pytorch_model.bin/p210.model.layers.23.self_attn.v_proj.weight b/pytorch_model.bin/p210.model.layers.23.self_attn.v_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p210.model.layers.23.self_attn.v_proj.weight rename to pytorch_model.bin/p210.model.layers.23.self_attn.v_proj.weight diff --git a/-split/pytorch_model.bin/p211.model.layers.23.self_attn.o_proj.weight b/pytorch_model.bin/p211.model.layers.23.self_attn.o_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p211.model.layers.23.self_attn.o_proj.weight rename to pytorch_model.bin/p211.model.layers.23.self_attn.o_proj.weight diff --git a/-split/pytorch_model.bin/p212.model.layers.23.mlp.gate_proj.weight b/pytorch_model.bin/p212.model.layers.23.mlp.gate_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p212.model.layers.23.mlp.gate_proj.weight rename to pytorch_model.bin/p212.model.layers.23.mlp.gate_proj.weight diff --git a/-split/pytorch_model.bin/p213.model.layers.23.mlp.up_proj.weight b/pytorch_model.bin/p213.model.layers.23.mlp.up_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p213.model.layers.23.mlp.up_proj.weight rename to pytorch_model.bin/p213.model.layers.23.mlp.up_proj.weight diff --git a/-split/pytorch_model.bin/p214.model.layers.23.mlp.down_proj.weight b/pytorch_model.bin/p214.model.layers.23.mlp.down_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p214.model.layers.23.mlp.down_proj.weight rename to pytorch_model.bin/p214.model.layers.23.mlp.down_proj.weight diff --git a/-split/pytorch_model.bin/p215.model.layers.23.input_layernorm.weight b/pytorch_model.bin/p215.model.layers.23.input_layernorm.weight similarity index 100% rename from -split/pytorch_model.bin/p215.model.layers.23.input_layernorm.weight rename to pytorch_model.bin/p215.model.layers.23.input_layernorm.weight diff --git a/-split/pytorch_model.bin/p216.model.layers.23.post_attention_layernorm.weight b/pytorch_model.bin/p216.model.layers.23.post_attention_layernorm.weight similarity index 100% rename from -split/pytorch_model.bin/p216.model.layers.23.post_attention_layernorm.weight rename to pytorch_model.bin/p216.model.layers.23.post_attention_layernorm.weight diff --git a/-split/pytorch_model.bin/p217.model.layers.24.self_attn.q_proj.weight b/pytorch_model.bin/p217.model.layers.24.self_attn.q_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p217.model.layers.24.self_attn.q_proj.weight rename to pytorch_model.bin/p217.model.layers.24.self_attn.q_proj.weight diff --git a/-split/pytorch_model.bin/p218.model.layers.24.self_attn.k_proj.weight b/pytorch_model.bin/p218.model.layers.24.self_attn.k_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p218.model.layers.24.self_attn.k_proj.weight rename to pytorch_model.bin/p218.model.layers.24.self_attn.k_proj.weight diff --git a/-split/pytorch_model.bin/p219.model.layers.24.self_attn.v_proj.weight b/pytorch_model.bin/p219.model.layers.24.self_attn.v_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p219.model.layers.24.self_attn.v_proj.weight rename to pytorch_model.bin/p219.model.layers.24.self_attn.v_proj.weight diff --git a/-split/pytorch_model.bin/p22.model.layers.2.self_attn.o_proj.weight b/pytorch_model.bin/p22.model.layers.2.self_attn.o_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p22.model.layers.2.self_attn.o_proj.weight rename to pytorch_model.bin/p22.model.layers.2.self_attn.o_proj.weight diff --git a/-split/pytorch_model.bin/p220.model.layers.24.self_attn.o_proj.weight b/pytorch_model.bin/p220.model.layers.24.self_attn.o_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p220.model.layers.24.self_attn.o_proj.weight rename to pytorch_model.bin/p220.model.layers.24.self_attn.o_proj.weight diff --git a/-split/pytorch_model.bin/p221.model.layers.24.mlp.gate_proj.weight b/pytorch_model.bin/p221.model.layers.24.mlp.gate_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p221.model.layers.24.mlp.gate_proj.weight rename to pytorch_model.bin/p221.model.layers.24.mlp.gate_proj.weight diff --git a/-split/pytorch_model.bin/p222.model.layers.24.mlp.up_proj.weight b/pytorch_model.bin/p222.model.layers.24.mlp.up_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p222.model.layers.24.mlp.up_proj.weight rename to pytorch_model.bin/p222.model.layers.24.mlp.up_proj.weight diff --git a/-split/pytorch_model.bin/p223.model.layers.24.mlp.down_proj.weight b/pytorch_model.bin/p223.model.layers.24.mlp.down_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p223.model.layers.24.mlp.down_proj.weight rename to pytorch_model.bin/p223.model.layers.24.mlp.down_proj.weight diff --git a/-split/pytorch_model.bin/p224.model.layers.24.input_layernorm.weight b/pytorch_model.bin/p224.model.layers.24.input_layernorm.weight similarity index 100% rename from -split/pytorch_model.bin/p224.model.layers.24.input_layernorm.weight rename to pytorch_model.bin/p224.model.layers.24.input_layernorm.weight diff --git a/-split/pytorch_model.bin/p225.model.layers.24.post_attention_layernorm.weight b/pytorch_model.bin/p225.model.layers.24.post_attention_layernorm.weight similarity index 100% rename from -split/pytorch_model.bin/p225.model.layers.24.post_attention_layernorm.weight rename to pytorch_model.bin/p225.model.layers.24.post_attention_layernorm.weight diff --git a/-split/pytorch_model.bin/p226.model.layers.25.self_attn.q_proj.weight b/pytorch_model.bin/p226.model.layers.25.self_attn.q_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p226.model.layers.25.self_attn.q_proj.weight rename to pytorch_model.bin/p226.model.layers.25.self_attn.q_proj.weight diff --git a/-split/pytorch_model.bin/p227.model.layers.25.self_attn.k_proj.weight b/pytorch_model.bin/p227.model.layers.25.self_attn.k_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p227.model.layers.25.self_attn.k_proj.weight rename to pytorch_model.bin/p227.model.layers.25.self_attn.k_proj.weight diff --git a/-split/pytorch_model.bin/p228.model.layers.25.self_attn.v_proj.weight b/pytorch_model.bin/p228.model.layers.25.self_attn.v_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p228.model.layers.25.self_attn.v_proj.weight rename to pytorch_model.bin/p228.model.layers.25.self_attn.v_proj.weight diff --git a/-split/pytorch_model.bin/p229.model.layers.25.self_attn.o_proj.weight b/pytorch_model.bin/p229.model.layers.25.self_attn.o_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p229.model.layers.25.self_attn.o_proj.weight rename to pytorch_model.bin/p229.model.layers.25.self_attn.o_proj.weight diff --git a/-split/pytorch_model.bin/p23.model.layers.2.mlp.gate_proj.weight b/pytorch_model.bin/p23.model.layers.2.mlp.gate_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p23.model.layers.2.mlp.gate_proj.weight rename to pytorch_model.bin/p23.model.layers.2.mlp.gate_proj.weight diff --git a/-split/pytorch_model.bin/p230.model.layers.25.mlp.gate_proj.weight b/pytorch_model.bin/p230.model.layers.25.mlp.gate_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p230.model.layers.25.mlp.gate_proj.weight rename to pytorch_model.bin/p230.model.layers.25.mlp.gate_proj.weight diff --git a/-split/pytorch_model.bin/p231.model.layers.25.mlp.up_proj.weight b/pytorch_model.bin/p231.model.layers.25.mlp.up_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p231.model.layers.25.mlp.up_proj.weight rename to pytorch_model.bin/p231.model.layers.25.mlp.up_proj.weight diff --git a/-split/pytorch_model.bin/p232.model.layers.25.mlp.down_proj.weight b/pytorch_model.bin/p232.model.layers.25.mlp.down_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p232.model.layers.25.mlp.down_proj.weight rename to pytorch_model.bin/p232.model.layers.25.mlp.down_proj.weight diff --git a/-split/pytorch_model.bin/p233.model.layers.25.input_layernorm.weight b/pytorch_model.bin/p233.model.layers.25.input_layernorm.weight similarity index 100% rename from -split/pytorch_model.bin/p233.model.layers.25.input_layernorm.weight rename to pytorch_model.bin/p233.model.layers.25.input_layernorm.weight diff --git a/-split/pytorch_model.bin/p234.model.layers.25.post_attention_layernorm.weight b/pytorch_model.bin/p234.model.layers.25.post_attention_layernorm.weight similarity index 100% rename from -split/pytorch_model.bin/p234.model.layers.25.post_attention_layernorm.weight rename to pytorch_model.bin/p234.model.layers.25.post_attention_layernorm.weight diff --git a/-split/pytorch_model.bin/p235.model.layers.26.self_attn.q_proj.weight b/pytorch_model.bin/p235.model.layers.26.self_attn.q_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p235.model.layers.26.self_attn.q_proj.weight rename to pytorch_model.bin/p235.model.layers.26.self_attn.q_proj.weight diff --git a/-split/pytorch_model.bin/p236.model.layers.26.self_attn.k_proj.weight b/pytorch_model.bin/p236.model.layers.26.self_attn.k_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p236.model.layers.26.self_attn.k_proj.weight rename to pytorch_model.bin/p236.model.layers.26.self_attn.k_proj.weight diff --git a/-split/pytorch_model.bin/p237.model.layers.26.self_attn.v_proj.weight b/pytorch_model.bin/p237.model.layers.26.self_attn.v_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p237.model.layers.26.self_attn.v_proj.weight rename to pytorch_model.bin/p237.model.layers.26.self_attn.v_proj.weight diff --git a/-split/pytorch_model.bin/p238.model.layers.26.self_attn.o_proj.weight b/pytorch_model.bin/p238.model.layers.26.self_attn.o_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p238.model.layers.26.self_attn.o_proj.weight rename to pytorch_model.bin/p238.model.layers.26.self_attn.o_proj.weight diff --git a/-split/pytorch_model.bin/p239.model.layers.26.mlp.gate_proj.weight b/pytorch_model.bin/p239.model.layers.26.mlp.gate_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p239.model.layers.26.mlp.gate_proj.weight rename to pytorch_model.bin/p239.model.layers.26.mlp.gate_proj.weight diff --git a/-split/pytorch_model.bin/p24.model.layers.2.mlp.up_proj.weight b/pytorch_model.bin/p24.model.layers.2.mlp.up_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p24.model.layers.2.mlp.up_proj.weight rename to pytorch_model.bin/p24.model.layers.2.mlp.up_proj.weight diff --git a/-split/pytorch_model.bin/p240.model.layers.26.mlp.up_proj.weight b/pytorch_model.bin/p240.model.layers.26.mlp.up_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p240.model.layers.26.mlp.up_proj.weight rename to pytorch_model.bin/p240.model.layers.26.mlp.up_proj.weight diff --git a/-split/pytorch_model.bin/p241.model.layers.26.mlp.down_proj.weight b/pytorch_model.bin/p241.model.layers.26.mlp.down_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p241.model.layers.26.mlp.down_proj.weight rename to pytorch_model.bin/p241.model.layers.26.mlp.down_proj.weight diff --git a/-split/pytorch_model.bin/p242.model.layers.26.input_layernorm.weight b/pytorch_model.bin/p242.model.layers.26.input_layernorm.weight similarity index 100% rename from -split/pytorch_model.bin/p242.model.layers.26.input_layernorm.weight rename to pytorch_model.bin/p242.model.layers.26.input_layernorm.weight diff --git a/-split/pytorch_model.bin/p243.model.layers.26.post_attention_layernorm.weight b/pytorch_model.bin/p243.model.layers.26.post_attention_layernorm.weight similarity index 100% rename from -split/pytorch_model.bin/p243.model.layers.26.post_attention_layernorm.weight rename to pytorch_model.bin/p243.model.layers.26.post_attention_layernorm.weight diff --git a/-split/pytorch_model.bin/p244.model.layers.27.self_attn.q_proj.weight b/pytorch_model.bin/p244.model.layers.27.self_attn.q_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p244.model.layers.27.self_attn.q_proj.weight rename to pytorch_model.bin/p244.model.layers.27.self_attn.q_proj.weight diff --git a/-split/pytorch_model.bin/p245.model.layers.27.self_attn.k_proj.weight b/pytorch_model.bin/p245.model.layers.27.self_attn.k_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p245.model.layers.27.self_attn.k_proj.weight rename to pytorch_model.bin/p245.model.layers.27.self_attn.k_proj.weight diff --git a/-split/pytorch_model.bin/p246.model.layers.27.self_attn.v_proj.weight b/pytorch_model.bin/p246.model.layers.27.self_attn.v_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p246.model.layers.27.self_attn.v_proj.weight rename to pytorch_model.bin/p246.model.layers.27.self_attn.v_proj.weight diff --git a/-split/pytorch_model.bin/p247.model.layers.27.self_attn.o_proj.weight b/pytorch_model.bin/p247.model.layers.27.self_attn.o_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p247.model.layers.27.self_attn.o_proj.weight rename to pytorch_model.bin/p247.model.layers.27.self_attn.o_proj.weight diff --git a/-split/pytorch_model.bin/p248.model.layers.27.mlp.gate_proj.weight b/pytorch_model.bin/p248.model.layers.27.mlp.gate_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p248.model.layers.27.mlp.gate_proj.weight rename to pytorch_model.bin/p248.model.layers.27.mlp.gate_proj.weight diff --git a/-split/pytorch_model.bin/p249.model.layers.27.mlp.up_proj.weight b/pytorch_model.bin/p249.model.layers.27.mlp.up_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p249.model.layers.27.mlp.up_proj.weight rename to pytorch_model.bin/p249.model.layers.27.mlp.up_proj.weight diff --git a/-split/pytorch_model.bin/p25.model.layers.2.mlp.down_proj.weight b/pytorch_model.bin/p25.model.layers.2.mlp.down_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p25.model.layers.2.mlp.down_proj.weight rename to pytorch_model.bin/p25.model.layers.2.mlp.down_proj.weight diff --git a/-split/pytorch_model.bin/p250.model.layers.27.mlp.down_proj.weight b/pytorch_model.bin/p250.model.layers.27.mlp.down_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p250.model.layers.27.mlp.down_proj.weight rename to pytorch_model.bin/p250.model.layers.27.mlp.down_proj.weight diff --git a/-split/pytorch_model.bin/p251.model.layers.27.input_layernorm.weight b/pytorch_model.bin/p251.model.layers.27.input_layernorm.weight similarity index 100% rename from -split/pytorch_model.bin/p251.model.layers.27.input_layernorm.weight rename to pytorch_model.bin/p251.model.layers.27.input_layernorm.weight diff --git a/-split/pytorch_model.bin/p252.model.layers.27.post_attention_layernorm.weight b/pytorch_model.bin/p252.model.layers.27.post_attention_layernorm.weight similarity index 100% rename from -split/pytorch_model.bin/p252.model.layers.27.post_attention_layernorm.weight rename to pytorch_model.bin/p252.model.layers.27.post_attention_layernorm.weight diff --git a/-split/pytorch_model.bin/p253.model.layers.28.self_attn.q_proj.weight b/pytorch_model.bin/p253.model.layers.28.self_attn.q_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p253.model.layers.28.self_attn.q_proj.weight rename to pytorch_model.bin/p253.model.layers.28.self_attn.q_proj.weight diff --git a/-split/pytorch_model.bin/p254.model.layers.28.self_attn.k_proj.weight b/pytorch_model.bin/p254.model.layers.28.self_attn.k_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p254.model.layers.28.self_attn.k_proj.weight rename to pytorch_model.bin/p254.model.layers.28.self_attn.k_proj.weight diff --git a/-split/pytorch_model.bin/p255.model.layers.28.self_attn.v_proj.weight b/pytorch_model.bin/p255.model.layers.28.self_attn.v_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p255.model.layers.28.self_attn.v_proj.weight rename to pytorch_model.bin/p255.model.layers.28.self_attn.v_proj.weight diff --git a/-split/pytorch_model.bin/p256.model.layers.28.self_attn.o_proj.weight b/pytorch_model.bin/p256.model.layers.28.self_attn.o_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p256.model.layers.28.self_attn.o_proj.weight rename to pytorch_model.bin/p256.model.layers.28.self_attn.o_proj.weight diff --git a/-split/pytorch_model.bin/p257.model.layers.28.mlp.gate_proj.weight b/pytorch_model.bin/p257.model.layers.28.mlp.gate_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p257.model.layers.28.mlp.gate_proj.weight rename to pytorch_model.bin/p257.model.layers.28.mlp.gate_proj.weight diff --git a/-split/pytorch_model.bin/p258.model.layers.28.mlp.up_proj.weight b/pytorch_model.bin/p258.model.layers.28.mlp.up_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p258.model.layers.28.mlp.up_proj.weight rename to pytorch_model.bin/p258.model.layers.28.mlp.up_proj.weight diff --git a/-split/pytorch_model.bin/p259.model.layers.28.mlp.down_proj.weight b/pytorch_model.bin/p259.model.layers.28.mlp.down_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p259.model.layers.28.mlp.down_proj.weight rename to pytorch_model.bin/p259.model.layers.28.mlp.down_proj.weight diff --git a/-split/pytorch_model.bin/p26.model.layers.2.input_layernorm.weight b/pytorch_model.bin/p26.model.layers.2.input_layernorm.weight similarity index 100% rename from -split/pytorch_model.bin/p26.model.layers.2.input_layernorm.weight rename to pytorch_model.bin/p26.model.layers.2.input_layernorm.weight diff --git a/-split/pytorch_model.bin/p260.model.layers.28.input_layernorm.weight b/pytorch_model.bin/p260.model.layers.28.input_layernorm.weight similarity index 100% rename from -split/pytorch_model.bin/p260.model.layers.28.input_layernorm.weight rename to pytorch_model.bin/p260.model.layers.28.input_layernorm.weight diff --git a/-split/pytorch_model.bin/p261.model.layers.28.post_attention_layernorm.weight b/pytorch_model.bin/p261.model.layers.28.post_attention_layernorm.weight similarity index 100% rename from -split/pytorch_model.bin/p261.model.layers.28.post_attention_layernorm.weight rename to pytorch_model.bin/p261.model.layers.28.post_attention_layernorm.weight diff --git a/-split/pytorch_model.bin/p262.model.layers.29.self_attn.q_proj.weight b/pytorch_model.bin/p262.model.layers.29.self_attn.q_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p262.model.layers.29.self_attn.q_proj.weight rename to pytorch_model.bin/p262.model.layers.29.self_attn.q_proj.weight diff --git a/-split/pytorch_model.bin/p263.model.layers.29.self_attn.k_proj.weight b/pytorch_model.bin/p263.model.layers.29.self_attn.k_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p263.model.layers.29.self_attn.k_proj.weight rename to pytorch_model.bin/p263.model.layers.29.self_attn.k_proj.weight diff --git a/-split/pytorch_model.bin/p264.model.layers.29.self_attn.v_proj.weight b/pytorch_model.bin/p264.model.layers.29.self_attn.v_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p264.model.layers.29.self_attn.v_proj.weight rename to pytorch_model.bin/p264.model.layers.29.self_attn.v_proj.weight diff --git a/-split/pytorch_model.bin/p265.model.layers.29.self_attn.o_proj.weight b/pytorch_model.bin/p265.model.layers.29.self_attn.o_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p265.model.layers.29.self_attn.o_proj.weight rename to pytorch_model.bin/p265.model.layers.29.self_attn.o_proj.weight diff --git a/-split/pytorch_model.bin/p266.model.layers.29.mlp.gate_proj.weight b/pytorch_model.bin/p266.model.layers.29.mlp.gate_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p266.model.layers.29.mlp.gate_proj.weight rename to pytorch_model.bin/p266.model.layers.29.mlp.gate_proj.weight diff --git a/-split/pytorch_model.bin/p267.model.layers.29.mlp.up_proj.weight b/pytorch_model.bin/p267.model.layers.29.mlp.up_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p267.model.layers.29.mlp.up_proj.weight rename to pytorch_model.bin/p267.model.layers.29.mlp.up_proj.weight diff --git a/-split/pytorch_model.bin/p268.model.layers.29.mlp.down_proj.weight b/pytorch_model.bin/p268.model.layers.29.mlp.down_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p268.model.layers.29.mlp.down_proj.weight rename to pytorch_model.bin/p268.model.layers.29.mlp.down_proj.weight diff --git a/-split/pytorch_model.bin/p269.model.layers.29.input_layernorm.weight b/pytorch_model.bin/p269.model.layers.29.input_layernorm.weight similarity index 100% rename from -split/pytorch_model.bin/p269.model.layers.29.input_layernorm.weight rename to pytorch_model.bin/p269.model.layers.29.input_layernorm.weight diff --git a/-split/pytorch_model.bin/p27.model.layers.2.post_attention_layernorm.weight b/pytorch_model.bin/p27.model.layers.2.post_attention_layernorm.weight similarity index 100% rename from -split/pytorch_model.bin/p27.model.layers.2.post_attention_layernorm.weight rename to pytorch_model.bin/p27.model.layers.2.post_attention_layernorm.weight diff --git a/-split/pytorch_model.bin/p270.model.layers.29.post_attention_layernorm.weight b/pytorch_model.bin/p270.model.layers.29.post_attention_layernorm.weight similarity index 100% rename from -split/pytorch_model.bin/p270.model.layers.29.post_attention_layernorm.weight rename to pytorch_model.bin/p270.model.layers.29.post_attention_layernorm.weight diff --git a/-split/pytorch_model.bin/p271.model.layers.30.self_attn.q_proj.weight b/pytorch_model.bin/p271.model.layers.30.self_attn.q_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p271.model.layers.30.self_attn.q_proj.weight rename to pytorch_model.bin/p271.model.layers.30.self_attn.q_proj.weight diff --git a/-split/pytorch_model.bin/p272.model.layers.30.self_attn.k_proj.weight b/pytorch_model.bin/p272.model.layers.30.self_attn.k_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p272.model.layers.30.self_attn.k_proj.weight rename to pytorch_model.bin/p272.model.layers.30.self_attn.k_proj.weight diff --git a/-split/pytorch_model.bin/p273.model.layers.30.self_attn.v_proj.weight b/pytorch_model.bin/p273.model.layers.30.self_attn.v_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p273.model.layers.30.self_attn.v_proj.weight rename to pytorch_model.bin/p273.model.layers.30.self_attn.v_proj.weight diff --git a/-split/pytorch_model.bin/p274.model.layers.30.self_attn.o_proj.weight b/pytorch_model.bin/p274.model.layers.30.self_attn.o_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p274.model.layers.30.self_attn.o_proj.weight rename to pytorch_model.bin/p274.model.layers.30.self_attn.o_proj.weight diff --git a/-split/pytorch_model.bin/p275.model.layers.30.mlp.gate_proj.weight b/pytorch_model.bin/p275.model.layers.30.mlp.gate_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p275.model.layers.30.mlp.gate_proj.weight rename to pytorch_model.bin/p275.model.layers.30.mlp.gate_proj.weight diff --git a/-split/pytorch_model.bin/p276.model.layers.30.mlp.up_proj.weight b/pytorch_model.bin/p276.model.layers.30.mlp.up_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p276.model.layers.30.mlp.up_proj.weight rename to pytorch_model.bin/p276.model.layers.30.mlp.up_proj.weight diff --git a/-split/pytorch_model.bin/p277.model.layers.30.mlp.down_proj.weight b/pytorch_model.bin/p277.model.layers.30.mlp.down_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p277.model.layers.30.mlp.down_proj.weight rename to pytorch_model.bin/p277.model.layers.30.mlp.down_proj.weight diff --git a/-split/pytorch_model.bin/p278.model.layers.30.input_layernorm.weight b/pytorch_model.bin/p278.model.layers.30.input_layernorm.weight similarity index 100% rename from -split/pytorch_model.bin/p278.model.layers.30.input_layernorm.weight rename to pytorch_model.bin/p278.model.layers.30.input_layernorm.weight diff --git a/-split/pytorch_model.bin/p279.model.layers.30.post_attention_layernorm.weight b/pytorch_model.bin/p279.model.layers.30.post_attention_layernorm.weight similarity index 100% rename from -split/pytorch_model.bin/p279.model.layers.30.post_attention_layernorm.weight rename to pytorch_model.bin/p279.model.layers.30.post_attention_layernorm.weight diff --git a/-split/pytorch_model.bin/p28.model.layers.3.self_attn.q_proj.weight b/pytorch_model.bin/p28.model.layers.3.self_attn.q_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p28.model.layers.3.self_attn.q_proj.weight rename to pytorch_model.bin/p28.model.layers.3.self_attn.q_proj.weight diff --git a/-split/pytorch_model.bin/p280.model.layers.31.self_attn.q_proj.weight b/pytorch_model.bin/p280.model.layers.31.self_attn.q_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p280.model.layers.31.self_attn.q_proj.weight rename to pytorch_model.bin/p280.model.layers.31.self_attn.q_proj.weight diff --git a/-split/pytorch_model.bin/p281.model.layers.31.self_attn.k_proj.weight b/pytorch_model.bin/p281.model.layers.31.self_attn.k_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p281.model.layers.31.self_attn.k_proj.weight rename to pytorch_model.bin/p281.model.layers.31.self_attn.k_proj.weight diff --git a/-split/pytorch_model.bin/p282.model.layers.31.self_attn.v_proj.weight b/pytorch_model.bin/p282.model.layers.31.self_attn.v_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p282.model.layers.31.self_attn.v_proj.weight rename to pytorch_model.bin/p282.model.layers.31.self_attn.v_proj.weight diff --git a/-split/pytorch_model.bin/p283.model.layers.31.self_attn.o_proj.weight b/pytorch_model.bin/p283.model.layers.31.self_attn.o_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p283.model.layers.31.self_attn.o_proj.weight rename to pytorch_model.bin/p283.model.layers.31.self_attn.o_proj.weight diff --git a/-split/pytorch_model.bin/p284.model.layers.31.mlp.gate_proj.weight b/pytorch_model.bin/p284.model.layers.31.mlp.gate_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p284.model.layers.31.mlp.gate_proj.weight rename to pytorch_model.bin/p284.model.layers.31.mlp.gate_proj.weight diff --git a/-split/pytorch_model.bin/p285.model.layers.31.mlp.up_proj.weight b/pytorch_model.bin/p285.model.layers.31.mlp.up_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p285.model.layers.31.mlp.up_proj.weight rename to pytorch_model.bin/p285.model.layers.31.mlp.up_proj.weight diff --git a/-split/pytorch_model.bin/p286.model.layers.31.mlp.down_proj.weight b/pytorch_model.bin/p286.model.layers.31.mlp.down_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p286.model.layers.31.mlp.down_proj.weight rename to pytorch_model.bin/p286.model.layers.31.mlp.down_proj.weight diff --git a/-split/pytorch_model.bin/p287.model.layers.31.input_layernorm.weight b/pytorch_model.bin/p287.model.layers.31.input_layernorm.weight similarity index 100% rename from -split/pytorch_model.bin/p287.model.layers.31.input_layernorm.weight rename to pytorch_model.bin/p287.model.layers.31.input_layernorm.weight diff --git a/-split/pytorch_model.bin/p288.model.layers.31.post_attention_layernorm.weight b/pytorch_model.bin/p288.model.layers.31.post_attention_layernorm.weight similarity index 100% rename from -split/pytorch_model.bin/p288.model.layers.31.post_attention_layernorm.weight rename to pytorch_model.bin/p288.model.layers.31.post_attention_layernorm.weight diff --git a/-split/pytorch_model.bin/p289.model.norm.weight b/pytorch_model.bin/p289.model.norm.weight similarity index 100% rename from -split/pytorch_model.bin/p289.model.norm.weight rename to pytorch_model.bin/p289.model.norm.weight diff --git a/-split/pytorch_model.bin/p29.model.layers.3.self_attn.k_proj.weight b/pytorch_model.bin/p29.model.layers.3.self_attn.k_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p29.model.layers.3.self_attn.k_proj.weight rename to pytorch_model.bin/p29.model.layers.3.self_attn.k_proj.weight diff --git a/-split/pytorch_model.bin/p290.lm_head.weight b/pytorch_model.bin/p290.lm_head.weight similarity index 100% rename from -split/pytorch_model.bin/p290.lm_head.weight rename to pytorch_model.bin/p290.lm_head.weight diff --git a/-split/pytorch_model.bin/p3.model.layers.0.self_attn.v_proj.weight b/pytorch_model.bin/p3.model.layers.0.self_attn.v_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p3.model.layers.0.self_attn.v_proj.weight rename to pytorch_model.bin/p3.model.layers.0.self_attn.v_proj.weight diff --git a/-split/pytorch_model.bin/p30.model.layers.3.self_attn.v_proj.weight b/pytorch_model.bin/p30.model.layers.3.self_attn.v_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p30.model.layers.3.self_attn.v_proj.weight rename to pytorch_model.bin/p30.model.layers.3.self_attn.v_proj.weight diff --git a/-split/pytorch_model.bin/p31.model.layers.3.self_attn.o_proj.weight b/pytorch_model.bin/p31.model.layers.3.self_attn.o_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p31.model.layers.3.self_attn.o_proj.weight rename to pytorch_model.bin/p31.model.layers.3.self_attn.o_proj.weight diff --git a/-split/pytorch_model.bin/p32.model.layers.3.mlp.gate_proj.weight b/pytorch_model.bin/p32.model.layers.3.mlp.gate_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p32.model.layers.3.mlp.gate_proj.weight rename to pytorch_model.bin/p32.model.layers.3.mlp.gate_proj.weight diff --git a/-split/pytorch_model.bin/p33.model.layers.3.mlp.up_proj.weight b/pytorch_model.bin/p33.model.layers.3.mlp.up_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p33.model.layers.3.mlp.up_proj.weight rename to pytorch_model.bin/p33.model.layers.3.mlp.up_proj.weight diff --git a/-split/pytorch_model.bin/p34.model.layers.3.mlp.down_proj.weight b/pytorch_model.bin/p34.model.layers.3.mlp.down_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p34.model.layers.3.mlp.down_proj.weight rename to pytorch_model.bin/p34.model.layers.3.mlp.down_proj.weight diff --git a/-split/pytorch_model.bin/p35.model.layers.3.input_layernorm.weight b/pytorch_model.bin/p35.model.layers.3.input_layernorm.weight similarity index 100% rename from -split/pytorch_model.bin/p35.model.layers.3.input_layernorm.weight rename to pytorch_model.bin/p35.model.layers.3.input_layernorm.weight diff --git a/-split/pytorch_model.bin/p36.model.layers.3.post_attention_layernorm.weight b/pytorch_model.bin/p36.model.layers.3.post_attention_layernorm.weight similarity index 100% rename from -split/pytorch_model.bin/p36.model.layers.3.post_attention_layernorm.weight rename to pytorch_model.bin/p36.model.layers.3.post_attention_layernorm.weight diff --git a/-split/pytorch_model.bin/p37.model.layers.4.self_attn.q_proj.weight b/pytorch_model.bin/p37.model.layers.4.self_attn.q_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p37.model.layers.4.self_attn.q_proj.weight rename to pytorch_model.bin/p37.model.layers.4.self_attn.q_proj.weight diff --git a/-split/pytorch_model.bin/p38.model.layers.4.self_attn.k_proj.weight b/pytorch_model.bin/p38.model.layers.4.self_attn.k_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p38.model.layers.4.self_attn.k_proj.weight rename to pytorch_model.bin/p38.model.layers.4.self_attn.k_proj.weight diff --git a/-split/pytorch_model.bin/p39.model.layers.4.self_attn.v_proj.weight b/pytorch_model.bin/p39.model.layers.4.self_attn.v_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p39.model.layers.4.self_attn.v_proj.weight rename to pytorch_model.bin/p39.model.layers.4.self_attn.v_proj.weight diff --git a/-split/pytorch_model.bin/p4.model.layers.0.self_attn.o_proj.weight b/pytorch_model.bin/p4.model.layers.0.self_attn.o_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p4.model.layers.0.self_attn.o_proj.weight rename to pytorch_model.bin/p4.model.layers.0.self_attn.o_proj.weight diff --git a/-split/pytorch_model.bin/p40.model.layers.4.self_attn.o_proj.weight b/pytorch_model.bin/p40.model.layers.4.self_attn.o_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p40.model.layers.4.self_attn.o_proj.weight rename to pytorch_model.bin/p40.model.layers.4.self_attn.o_proj.weight diff --git a/-split/pytorch_model.bin/p41.model.layers.4.mlp.gate_proj.weight b/pytorch_model.bin/p41.model.layers.4.mlp.gate_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p41.model.layers.4.mlp.gate_proj.weight rename to pytorch_model.bin/p41.model.layers.4.mlp.gate_proj.weight diff --git a/-split/pytorch_model.bin/p42.model.layers.4.mlp.up_proj.weight b/pytorch_model.bin/p42.model.layers.4.mlp.up_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p42.model.layers.4.mlp.up_proj.weight rename to pytorch_model.bin/p42.model.layers.4.mlp.up_proj.weight diff --git a/-split/pytorch_model.bin/p43.model.layers.4.mlp.down_proj.weight b/pytorch_model.bin/p43.model.layers.4.mlp.down_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p43.model.layers.4.mlp.down_proj.weight rename to pytorch_model.bin/p43.model.layers.4.mlp.down_proj.weight diff --git a/-split/pytorch_model.bin/p44.model.layers.4.input_layernorm.weight b/pytorch_model.bin/p44.model.layers.4.input_layernorm.weight similarity index 100% rename from -split/pytorch_model.bin/p44.model.layers.4.input_layernorm.weight rename to pytorch_model.bin/p44.model.layers.4.input_layernorm.weight diff --git a/-split/pytorch_model.bin/p45.model.layers.4.post_attention_layernorm.weight b/pytorch_model.bin/p45.model.layers.4.post_attention_layernorm.weight similarity index 100% rename from -split/pytorch_model.bin/p45.model.layers.4.post_attention_layernorm.weight rename to pytorch_model.bin/p45.model.layers.4.post_attention_layernorm.weight diff --git a/-split/pytorch_model.bin/p46.model.layers.5.self_attn.q_proj.weight b/pytorch_model.bin/p46.model.layers.5.self_attn.q_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p46.model.layers.5.self_attn.q_proj.weight rename to pytorch_model.bin/p46.model.layers.5.self_attn.q_proj.weight diff --git a/-split/pytorch_model.bin/p47.model.layers.5.self_attn.k_proj.weight b/pytorch_model.bin/p47.model.layers.5.self_attn.k_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p47.model.layers.5.self_attn.k_proj.weight rename to pytorch_model.bin/p47.model.layers.5.self_attn.k_proj.weight diff --git a/-split/pytorch_model.bin/p48.model.layers.5.self_attn.v_proj.weight b/pytorch_model.bin/p48.model.layers.5.self_attn.v_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p48.model.layers.5.self_attn.v_proj.weight rename to pytorch_model.bin/p48.model.layers.5.self_attn.v_proj.weight diff --git a/-split/pytorch_model.bin/p49.model.layers.5.self_attn.o_proj.weight b/pytorch_model.bin/p49.model.layers.5.self_attn.o_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p49.model.layers.5.self_attn.o_proj.weight rename to pytorch_model.bin/p49.model.layers.5.self_attn.o_proj.weight diff --git a/-split/pytorch_model.bin/p5.model.layers.0.mlp.gate_proj.weight b/pytorch_model.bin/p5.model.layers.0.mlp.gate_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p5.model.layers.0.mlp.gate_proj.weight rename to pytorch_model.bin/p5.model.layers.0.mlp.gate_proj.weight diff --git a/-split/pytorch_model.bin/p50.model.layers.5.mlp.gate_proj.weight b/pytorch_model.bin/p50.model.layers.5.mlp.gate_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p50.model.layers.5.mlp.gate_proj.weight rename to pytorch_model.bin/p50.model.layers.5.mlp.gate_proj.weight diff --git a/-split/pytorch_model.bin/p51.model.layers.5.mlp.up_proj.weight b/pytorch_model.bin/p51.model.layers.5.mlp.up_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p51.model.layers.5.mlp.up_proj.weight rename to pytorch_model.bin/p51.model.layers.5.mlp.up_proj.weight diff --git a/-split/pytorch_model.bin/p52.model.layers.5.mlp.down_proj.weight b/pytorch_model.bin/p52.model.layers.5.mlp.down_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p52.model.layers.5.mlp.down_proj.weight rename to pytorch_model.bin/p52.model.layers.5.mlp.down_proj.weight diff --git a/-split/pytorch_model.bin/p53.model.layers.5.input_layernorm.weight b/pytorch_model.bin/p53.model.layers.5.input_layernorm.weight similarity index 100% rename from -split/pytorch_model.bin/p53.model.layers.5.input_layernorm.weight rename to pytorch_model.bin/p53.model.layers.5.input_layernorm.weight diff --git a/-split/pytorch_model.bin/p54.model.layers.5.post_attention_layernorm.weight b/pytorch_model.bin/p54.model.layers.5.post_attention_layernorm.weight similarity index 100% rename from -split/pytorch_model.bin/p54.model.layers.5.post_attention_layernorm.weight rename to pytorch_model.bin/p54.model.layers.5.post_attention_layernorm.weight diff --git a/-split/pytorch_model.bin/p55.model.layers.6.self_attn.q_proj.weight b/pytorch_model.bin/p55.model.layers.6.self_attn.q_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p55.model.layers.6.self_attn.q_proj.weight rename to pytorch_model.bin/p55.model.layers.6.self_attn.q_proj.weight diff --git a/-split/pytorch_model.bin/p56.model.layers.6.self_attn.k_proj.weight b/pytorch_model.bin/p56.model.layers.6.self_attn.k_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p56.model.layers.6.self_attn.k_proj.weight rename to pytorch_model.bin/p56.model.layers.6.self_attn.k_proj.weight diff --git a/-split/pytorch_model.bin/p57.model.layers.6.self_attn.v_proj.weight b/pytorch_model.bin/p57.model.layers.6.self_attn.v_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p57.model.layers.6.self_attn.v_proj.weight rename to pytorch_model.bin/p57.model.layers.6.self_attn.v_proj.weight diff --git a/-split/pytorch_model.bin/p58.model.layers.6.self_attn.o_proj.weight b/pytorch_model.bin/p58.model.layers.6.self_attn.o_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p58.model.layers.6.self_attn.o_proj.weight rename to pytorch_model.bin/p58.model.layers.6.self_attn.o_proj.weight diff --git a/-split/pytorch_model.bin/p59.model.layers.6.mlp.gate_proj.weight b/pytorch_model.bin/p59.model.layers.6.mlp.gate_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p59.model.layers.6.mlp.gate_proj.weight rename to pytorch_model.bin/p59.model.layers.6.mlp.gate_proj.weight diff --git a/-split/pytorch_model.bin/p6.model.layers.0.mlp.up_proj.weight b/pytorch_model.bin/p6.model.layers.0.mlp.up_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p6.model.layers.0.mlp.up_proj.weight rename to pytorch_model.bin/p6.model.layers.0.mlp.up_proj.weight diff --git a/-split/pytorch_model.bin/p60.model.layers.6.mlp.up_proj.weight b/pytorch_model.bin/p60.model.layers.6.mlp.up_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p60.model.layers.6.mlp.up_proj.weight rename to pytorch_model.bin/p60.model.layers.6.mlp.up_proj.weight diff --git a/-split/pytorch_model.bin/p61.model.layers.6.mlp.down_proj.weight b/pytorch_model.bin/p61.model.layers.6.mlp.down_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p61.model.layers.6.mlp.down_proj.weight rename to pytorch_model.bin/p61.model.layers.6.mlp.down_proj.weight diff --git a/-split/pytorch_model.bin/p62.model.layers.6.input_layernorm.weight b/pytorch_model.bin/p62.model.layers.6.input_layernorm.weight similarity index 100% rename from -split/pytorch_model.bin/p62.model.layers.6.input_layernorm.weight rename to pytorch_model.bin/p62.model.layers.6.input_layernorm.weight diff --git a/-split/pytorch_model.bin/p63.model.layers.6.post_attention_layernorm.weight b/pytorch_model.bin/p63.model.layers.6.post_attention_layernorm.weight similarity index 100% rename from -split/pytorch_model.bin/p63.model.layers.6.post_attention_layernorm.weight rename to pytorch_model.bin/p63.model.layers.6.post_attention_layernorm.weight diff --git a/-split/pytorch_model.bin/p64.model.layers.7.self_attn.q_proj.weight b/pytorch_model.bin/p64.model.layers.7.self_attn.q_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p64.model.layers.7.self_attn.q_proj.weight rename to pytorch_model.bin/p64.model.layers.7.self_attn.q_proj.weight diff --git a/-split/pytorch_model.bin/p65.model.layers.7.self_attn.k_proj.weight b/pytorch_model.bin/p65.model.layers.7.self_attn.k_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p65.model.layers.7.self_attn.k_proj.weight rename to pytorch_model.bin/p65.model.layers.7.self_attn.k_proj.weight diff --git a/-split/pytorch_model.bin/p66.model.layers.7.self_attn.v_proj.weight b/pytorch_model.bin/p66.model.layers.7.self_attn.v_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p66.model.layers.7.self_attn.v_proj.weight rename to pytorch_model.bin/p66.model.layers.7.self_attn.v_proj.weight diff --git a/-split/pytorch_model.bin/p67.model.layers.7.self_attn.o_proj.weight b/pytorch_model.bin/p67.model.layers.7.self_attn.o_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p67.model.layers.7.self_attn.o_proj.weight rename to pytorch_model.bin/p67.model.layers.7.self_attn.o_proj.weight diff --git a/-split/pytorch_model.bin/p68.model.layers.7.mlp.gate_proj.weight b/pytorch_model.bin/p68.model.layers.7.mlp.gate_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p68.model.layers.7.mlp.gate_proj.weight rename to pytorch_model.bin/p68.model.layers.7.mlp.gate_proj.weight diff --git a/-split/pytorch_model.bin/p69.model.layers.7.mlp.up_proj.weight b/pytorch_model.bin/p69.model.layers.7.mlp.up_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p69.model.layers.7.mlp.up_proj.weight rename to pytorch_model.bin/p69.model.layers.7.mlp.up_proj.weight diff --git a/-split/pytorch_model.bin/p7.model.layers.0.mlp.down_proj.weight b/pytorch_model.bin/p7.model.layers.0.mlp.down_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p7.model.layers.0.mlp.down_proj.weight rename to pytorch_model.bin/p7.model.layers.0.mlp.down_proj.weight diff --git a/-split/pytorch_model.bin/p70.model.layers.7.mlp.down_proj.weight b/pytorch_model.bin/p70.model.layers.7.mlp.down_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p70.model.layers.7.mlp.down_proj.weight rename to pytorch_model.bin/p70.model.layers.7.mlp.down_proj.weight diff --git a/-split/pytorch_model.bin/p71.model.layers.7.input_layernorm.weight b/pytorch_model.bin/p71.model.layers.7.input_layernorm.weight similarity index 100% rename from -split/pytorch_model.bin/p71.model.layers.7.input_layernorm.weight rename to pytorch_model.bin/p71.model.layers.7.input_layernorm.weight diff --git a/-split/pytorch_model.bin/p72.model.layers.7.post_attention_layernorm.weight b/pytorch_model.bin/p72.model.layers.7.post_attention_layernorm.weight similarity index 100% rename from -split/pytorch_model.bin/p72.model.layers.7.post_attention_layernorm.weight rename to pytorch_model.bin/p72.model.layers.7.post_attention_layernorm.weight diff --git a/-split/pytorch_model.bin/p73.model.layers.8.self_attn.q_proj.weight b/pytorch_model.bin/p73.model.layers.8.self_attn.q_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p73.model.layers.8.self_attn.q_proj.weight rename to pytorch_model.bin/p73.model.layers.8.self_attn.q_proj.weight diff --git a/-split/pytorch_model.bin/p74.model.layers.8.self_attn.k_proj.weight b/pytorch_model.bin/p74.model.layers.8.self_attn.k_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p74.model.layers.8.self_attn.k_proj.weight rename to pytorch_model.bin/p74.model.layers.8.self_attn.k_proj.weight diff --git a/-split/pytorch_model.bin/p75.model.layers.8.self_attn.v_proj.weight b/pytorch_model.bin/p75.model.layers.8.self_attn.v_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p75.model.layers.8.self_attn.v_proj.weight rename to pytorch_model.bin/p75.model.layers.8.self_attn.v_proj.weight diff --git a/-split/pytorch_model.bin/p76.model.layers.8.self_attn.o_proj.weight b/pytorch_model.bin/p76.model.layers.8.self_attn.o_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p76.model.layers.8.self_attn.o_proj.weight rename to pytorch_model.bin/p76.model.layers.8.self_attn.o_proj.weight diff --git a/-split/pytorch_model.bin/p77.model.layers.8.mlp.gate_proj.weight b/pytorch_model.bin/p77.model.layers.8.mlp.gate_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p77.model.layers.8.mlp.gate_proj.weight rename to pytorch_model.bin/p77.model.layers.8.mlp.gate_proj.weight diff --git a/-split/pytorch_model.bin/p78.model.layers.8.mlp.up_proj.weight b/pytorch_model.bin/p78.model.layers.8.mlp.up_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p78.model.layers.8.mlp.up_proj.weight rename to pytorch_model.bin/p78.model.layers.8.mlp.up_proj.weight diff --git a/-split/pytorch_model.bin/p79.model.layers.8.mlp.down_proj.weight b/pytorch_model.bin/p79.model.layers.8.mlp.down_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p79.model.layers.8.mlp.down_proj.weight rename to pytorch_model.bin/p79.model.layers.8.mlp.down_proj.weight diff --git a/-split/pytorch_model.bin/p8.model.layers.0.input_layernorm.weight b/pytorch_model.bin/p8.model.layers.0.input_layernorm.weight similarity index 100% rename from -split/pytorch_model.bin/p8.model.layers.0.input_layernorm.weight rename to pytorch_model.bin/p8.model.layers.0.input_layernorm.weight diff --git a/-split/pytorch_model.bin/p80.model.layers.8.input_layernorm.weight b/pytorch_model.bin/p80.model.layers.8.input_layernorm.weight similarity index 100% rename from -split/pytorch_model.bin/p80.model.layers.8.input_layernorm.weight rename to pytorch_model.bin/p80.model.layers.8.input_layernorm.weight diff --git a/-split/pytorch_model.bin/p81.model.layers.8.post_attention_layernorm.weight b/pytorch_model.bin/p81.model.layers.8.post_attention_layernorm.weight similarity index 100% rename from -split/pytorch_model.bin/p81.model.layers.8.post_attention_layernorm.weight rename to pytorch_model.bin/p81.model.layers.8.post_attention_layernorm.weight diff --git a/-split/pytorch_model.bin/p82.model.layers.9.self_attn.q_proj.weight b/pytorch_model.bin/p82.model.layers.9.self_attn.q_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p82.model.layers.9.self_attn.q_proj.weight rename to pytorch_model.bin/p82.model.layers.9.self_attn.q_proj.weight diff --git a/-split/pytorch_model.bin/p83.model.layers.9.self_attn.k_proj.weight b/pytorch_model.bin/p83.model.layers.9.self_attn.k_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p83.model.layers.9.self_attn.k_proj.weight rename to pytorch_model.bin/p83.model.layers.9.self_attn.k_proj.weight diff --git a/-split/pytorch_model.bin/p84.model.layers.9.self_attn.v_proj.weight b/pytorch_model.bin/p84.model.layers.9.self_attn.v_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p84.model.layers.9.self_attn.v_proj.weight rename to pytorch_model.bin/p84.model.layers.9.self_attn.v_proj.weight diff --git a/-split/pytorch_model.bin/p85.model.layers.9.self_attn.o_proj.weight b/pytorch_model.bin/p85.model.layers.9.self_attn.o_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p85.model.layers.9.self_attn.o_proj.weight rename to pytorch_model.bin/p85.model.layers.9.self_attn.o_proj.weight diff --git a/-split/pytorch_model.bin/p86.model.layers.9.mlp.gate_proj.weight b/pytorch_model.bin/p86.model.layers.9.mlp.gate_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p86.model.layers.9.mlp.gate_proj.weight rename to pytorch_model.bin/p86.model.layers.9.mlp.gate_proj.weight diff --git a/-split/pytorch_model.bin/p87.model.layers.9.mlp.up_proj.weight b/pytorch_model.bin/p87.model.layers.9.mlp.up_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p87.model.layers.9.mlp.up_proj.weight rename to pytorch_model.bin/p87.model.layers.9.mlp.up_proj.weight diff --git a/-split/pytorch_model.bin/p88.model.layers.9.mlp.down_proj.weight b/pytorch_model.bin/p88.model.layers.9.mlp.down_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p88.model.layers.9.mlp.down_proj.weight rename to pytorch_model.bin/p88.model.layers.9.mlp.down_proj.weight diff --git a/-split/pytorch_model.bin/p89.model.layers.9.input_layernorm.weight b/pytorch_model.bin/p89.model.layers.9.input_layernorm.weight similarity index 100% rename from -split/pytorch_model.bin/p89.model.layers.9.input_layernorm.weight rename to pytorch_model.bin/p89.model.layers.9.input_layernorm.weight diff --git a/-split/pytorch_model.bin/p9.model.layers.0.post_attention_layernorm.weight b/pytorch_model.bin/p9.model.layers.0.post_attention_layernorm.weight similarity index 100% rename from -split/pytorch_model.bin/p9.model.layers.0.post_attention_layernorm.weight rename to pytorch_model.bin/p9.model.layers.0.post_attention_layernorm.weight diff --git a/-split/pytorch_model.bin/p90.model.layers.9.post_attention_layernorm.weight b/pytorch_model.bin/p90.model.layers.9.post_attention_layernorm.weight similarity index 100% rename from -split/pytorch_model.bin/p90.model.layers.9.post_attention_layernorm.weight rename to pytorch_model.bin/p90.model.layers.9.post_attention_layernorm.weight diff --git a/-split/pytorch_model.bin/p91.model.layers.10.self_attn.q_proj.weight b/pytorch_model.bin/p91.model.layers.10.self_attn.q_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p91.model.layers.10.self_attn.q_proj.weight rename to pytorch_model.bin/p91.model.layers.10.self_attn.q_proj.weight diff --git a/-split/pytorch_model.bin/p92.model.layers.10.self_attn.k_proj.weight b/pytorch_model.bin/p92.model.layers.10.self_attn.k_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p92.model.layers.10.self_attn.k_proj.weight rename to pytorch_model.bin/p92.model.layers.10.self_attn.k_proj.weight diff --git a/-split/pytorch_model.bin/p93.model.layers.10.self_attn.v_proj.weight b/pytorch_model.bin/p93.model.layers.10.self_attn.v_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p93.model.layers.10.self_attn.v_proj.weight rename to pytorch_model.bin/p93.model.layers.10.self_attn.v_proj.weight diff --git a/-split/pytorch_model.bin/p94.model.layers.10.self_attn.o_proj.weight b/pytorch_model.bin/p94.model.layers.10.self_attn.o_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p94.model.layers.10.self_attn.o_proj.weight rename to pytorch_model.bin/p94.model.layers.10.self_attn.o_proj.weight diff --git a/-split/pytorch_model.bin/p95.model.layers.10.mlp.gate_proj.weight b/pytorch_model.bin/p95.model.layers.10.mlp.gate_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p95.model.layers.10.mlp.gate_proj.weight rename to pytorch_model.bin/p95.model.layers.10.mlp.gate_proj.weight diff --git a/-split/pytorch_model.bin/p96.model.layers.10.mlp.up_proj.weight b/pytorch_model.bin/p96.model.layers.10.mlp.up_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p96.model.layers.10.mlp.up_proj.weight rename to pytorch_model.bin/p96.model.layers.10.mlp.up_proj.weight diff --git a/-split/pytorch_model.bin/p97.model.layers.10.mlp.down_proj.weight b/pytorch_model.bin/p97.model.layers.10.mlp.down_proj.weight similarity index 100% rename from -split/pytorch_model.bin/p97.model.layers.10.mlp.down_proj.weight rename to pytorch_model.bin/p97.model.layers.10.mlp.down_proj.weight diff --git a/-split/pytorch_model.bin/p98.model.layers.10.input_layernorm.weight b/pytorch_model.bin/p98.model.layers.10.input_layernorm.weight similarity index 100% rename from -split/pytorch_model.bin/p98.model.layers.10.input_layernorm.weight rename to pytorch_model.bin/p98.model.layers.10.input_layernorm.weight diff --git a/-split/pytorch_model.bin/p99.model.layers.10.post_attention_layernorm.weight b/pytorch_model.bin/p99.model.layers.10.post_attention_layernorm.weight similarity index 100% rename from -split/pytorch_model.bin/p99.model.layers.10.post_attention_layernorm.weight rename to pytorch_model.bin/p99.model.layers.10.post_attention_layernorm.weight